2 * OpenEXR (.exr) image decoder
3 * Copyright (c) 2006 Industrial Light & Magic, a division of Lucas Digital Ltd. LLC
4 * Copyright (c) 2009 Jimmy Christensen
6 * B44/B44A, Tile, UINT32 added by Jokyo Images support by CNC - French National Center for Cinema
8 * This file is part of FFmpeg.
10 * FFmpeg is free software; you can redistribute it and/or
11 * modify it under the terms of the GNU Lesser General Public
12 * License as published by the Free Software Foundation; either
13 * version 2.1 of the License, or (at your option) any later version.
15 * FFmpeg is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
18 * Lesser General Public License for more details.
20 * You should have received a copy of the GNU Lesser General Public
21 * License along with FFmpeg; if not, write to the Free Software
22 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
28 * @author Jimmy Christensen
30 * For more information on the OpenEXR format, visit:
37 #include "libavutil/avassert.h"
38 #include "libavutil/common.h"
39 #include "libavutil/imgutils.h"
40 #include "libavutil/intfloat.h"
41 #include "libavutil/avstring.h"
42 #include "libavutil/opt.h"
43 #include "libavutil/color_utils.h"
46 #include "bytestream.h"
55 #include "half2float.h"
80 enum ExrTileLevelMode {
82 EXR_TILE_LEVEL_MIPMAP,
83 EXR_TILE_LEVEL_RIPMAP,
84 EXR_TILE_LEVEL_UNKNOWN,
87 enum ExrTileLevelRound {
90 EXR_TILE_ROUND_UNKNOWN,
93 typedef struct HuffEntry {
99 typedef struct EXRChannel {
101 enum ExrPixelType pixel_type;
104 typedef struct EXRTileAttribute {
107 enum ExrTileLevelMode level_mode;
108 enum ExrTileLevelRound level_round;
111 typedef struct EXRThreadData {
112 uint8_t *uncompressed_data;
113 int uncompressed_size;
130 uint8_t *rle_raw_data;
131 unsigned rle_raw_size;
137 int channel_line_size;
145 typedef struct EXRContext {
148 AVCodecContext *avctx;
152 BswapDSPContext bbdsp;
155 enum ExrCompr compression;
156 enum ExrPixelType pixel_type;
157 int channel_offsets[4]; // 0 = red, 1 = green, 2 = blue and 3 = alpha
158 const AVPixFmtDescriptor *desc;
164 uint32_t xdelta, ydelta;
166 int scan_lines_per_block;
168 EXRTileAttribute tile_attr; /* header data attribute of tile */
169 int is_tile; /* 0 if scanline, 1 if tile */
173 int is_luma;/* 1 if there is an Y plane */
179 EXRChannel *channels;
181 int current_channel_offset;
182 uint32_t chunk_count;
184 EXRThreadData *thread_data;
189 enum AVColorTransferCharacteristic apply_trc_type;
191 union av_intfloat32 gamma_table[65536];
193 uint32_t mantissatable[2048];
194 uint32_t exponenttable[64];
195 uint16_t offsettable[64];
198 static int zip_uncompress(EXRContext *s, const uint8_t *src, int compressed_size,
199 int uncompressed_size, EXRThreadData *td)
201 unsigned long dest_len = uncompressed_size;
203 if (uncompress(td->tmp, &dest_len, src, compressed_size) != Z_OK ||
204 dest_len != uncompressed_size)
205 return AVERROR_INVALIDDATA;
207 av_assert1(uncompressed_size % 2 == 0);
209 s->dsp.predictor(td->tmp, uncompressed_size);
210 s->dsp.reorder_pixels(td->uncompressed_data, td->tmp, uncompressed_size);
215 static int rle(uint8_t *dst, const uint8_t *src,
216 int compressed_size, int uncompressed_size)
219 const int8_t *s = src;
220 int ssize = compressed_size;
221 int dsize = uncompressed_size;
222 uint8_t *dend = d + dsize;
231 if ((dsize -= count) < 0 ||
232 (ssize -= count + 1) < 0)
233 return AVERROR_INVALIDDATA;
240 if ((dsize -= count) < 0 ||
242 return AVERROR_INVALIDDATA;
252 return AVERROR_INVALIDDATA;
257 static int rle_uncompress(EXRContext *ctx, const uint8_t *src, int compressed_size,
258 int uncompressed_size, EXRThreadData *td)
260 rle(td->tmp, src, compressed_size, uncompressed_size);
262 av_assert1(uncompressed_size % 2 == 0);
264 ctx->dsp.predictor(td->tmp, uncompressed_size);
265 ctx->dsp.reorder_pixels(td->uncompressed_data, td->tmp, uncompressed_size);
270 #define USHORT_RANGE (1 << 16)
271 #define BITMAP_SIZE (1 << 13)
273 static uint16_t reverse_lut(const uint8_t *bitmap, uint16_t *lut)
277 for (i = 0; i < USHORT_RANGE; i++)
278 if ((i == 0) || (bitmap[i >> 3] & (1 << (i & 7))))
283 memset(lut + k, 0, (USHORT_RANGE - k) * 2);
288 static void apply_lut(const uint16_t *lut, uint16_t *dst, int dsize)
292 for (i = 0; i < dsize; ++i)
293 dst[i] = lut[dst[i]];
296 #define HUF_ENCBITS 16 // literal (value) bit length
297 #define HUF_ENCSIZE ((1 << HUF_ENCBITS) + 1) // encoding table size
299 static void huf_canonical_code_table(uint64_t *freq)
301 uint64_t c, n[59] = { 0 };
304 for (i = 0; i < HUF_ENCSIZE; i++)
308 for (i = 58; i > 0; --i) {
309 uint64_t nc = ((c + n[i]) >> 1);
314 for (i = 0; i < HUF_ENCSIZE; ++i) {
318 freq[i] = l | (n[l]++ << 6);
322 #define SHORT_ZEROCODE_RUN 59
323 #define LONG_ZEROCODE_RUN 63
324 #define SHORTEST_LONG_RUN (2 + LONG_ZEROCODE_RUN - SHORT_ZEROCODE_RUN)
325 #define LONGEST_LONG_RUN (255 + SHORTEST_LONG_RUN)
327 static int huf_unpack_enc_table(GetByteContext *gb,
328 int32_t im, int32_t iM, uint64_t *freq)
331 int ret = init_get_bits8(&gbit, gb->buffer, bytestream2_get_bytes_left(gb));
335 for (; im <= iM; im++) {
336 uint64_t l = freq[im] = get_bits(&gbit, 6);
338 if (l == LONG_ZEROCODE_RUN) {
339 int zerun = get_bits(&gbit, 8) + SHORTEST_LONG_RUN;
341 if (im + zerun > iM + 1)
342 return AVERROR_INVALIDDATA;
348 } else if (l >= SHORT_ZEROCODE_RUN) {
349 int zerun = l - SHORT_ZEROCODE_RUN + 2;
351 if (im + zerun > iM + 1)
352 return AVERROR_INVALIDDATA;
361 bytestream2_skip(gb, (get_bits_count(&gbit) + 7) / 8);
362 huf_canonical_code_table(freq);
367 static int huf_build_dec_table(EXRContext *s,
368 EXRThreadData *td, int im, int iM)
373 for (int i = im; i < iM; i++) {
375 td->he[j].len = td->freq[i] & 63;
376 td->he[j].code = td->freq[i] >> 6;
377 if (td->he[j].len > 32) {
378 avpriv_request_sample(s->avctx, "Too big code length");
379 return AVERROR_PATCHWELCOME;
381 if (td->he[j].len > 0)
392 if (td->run_sym == -1) {
393 avpriv_request_sample(s->avctx, "No place for run symbol");
394 return AVERROR_PATCHWELCOME;
397 td->he[j].sym = td->run_sym;
398 td->he[j].len = td->freq[iM] & 63;
399 if (td->he[j].len > 32) {
400 avpriv_request_sample(s->avctx, "Too big code length");
401 return AVERROR_PATCHWELCOME;
403 td->he[j].code = td->freq[iM] >> 6;
406 ff_free_vlc(&td->vlc);
407 return ff_init_vlc_sparse(&td->vlc, 12, j,
408 &td->he[0].len, sizeof(td->he[0]), sizeof(td->he[0].len),
409 &td->he[0].code, sizeof(td->he[0]), sizeof(td->he[0].code),
410 &td->he[0].sym, sizeof(td->he[0]), sizeof(td->he[0].sym), 0);
413 static int huf_decode(VLC *vlc, GetByteContext *gb, int nbits, int run_sym,
414 int no, uint16_t *out)
419 init_get_bits(&gbit, gb->buffer, nbits);
420 while (get_bits_left(&gbit) > 0 && oe < no) {
421 uint16_t x = get_vlc2(&gbit, vlc->table, 12, 2);
424 int run = get_bits(&gbit, 8);
425 uint16_t fill = out[oe - 1];
437 static int huf_uncompress(EXRContext *s,
440 uint16_t *dst, int dst_size)
446 im = bytestream2_get_le32(gb);
447 iM = bytestream2_get_le32(gb);
448 bytestream2_skip(gb, 4);
449 nBits = bytestream2_get_le32(gb);
450 if (im < 0 || im >= HUF_ENCSIZE ||
451 iM < 0 || iM >= HUF_ENCSIZE)
452 return AVERROR_INVALIDDATA;
454 bytestream2_skip(gb, 4);
457 td->freq = av_malloc_array(HUF_ENCSIZE, sizeof(*td->freq));
459 td->he = av_calloc(HUF_ENCSIZE, sizeof(*td->he));
460 if (!td->freq || !td->he) {
461 ret = AVERROR(ENOMEM);
465 memset(td->freq, 0, sizeof(*td->freq) * HUF_ENCSIZE);
466 if ((ret = huf_unpack_enc_table(gb, im, iM, td->freq)) < 0)
469 if (nBits > 8 * bytestream2_get_bytes_left(gb)) {
470 ret = AVERROR_INVALIDDATA;
474 if ((ret = huf_build_dec_table(s, td, im, iM)) < 0)
476 return huf_decode(&td->vlc, gb, nBits, td->run_sym, dst_size, dst);
479 static inline void wdec14(uint16_t l, uint16_t h, uint16_t *a, uint16_t *b)
484 int ai = ls + (hi & 1) + (hi >> 1);
486 int16_t bs = ai - hi;
493 #define A_OFFSET (1 << (NBITS - 1))
494 #define MOD_MASK ((1 << NBITS) - 1)
496 static inline void wdec16(uint16_t l, uint16_t h, uint16_t *a, uint16_t *b)
500 int bb = (m - (d >> 1)) & MOD_MASK;
501 int aa = (d + bb - A_OFFSET) & MOD_MASK;
506 static void wav_decode(uint16_t *in, int nx, int ox,
507 int ny, int oy, uint16_t mx)
509 int w14 = (mx < (1 << 14));
510 int n = (nx > ny) ? ny : nx;
523 uint16_t *ey = in + oy * (ny - p2);
524 uint16_t i00, i01, i10, i11;
530 for (; py <= ey; py += oy2) {
532 uint16_t *ex = py + ox * (nx - p2);
534 for (; px <= ex; px += ox2) {
535 uint16_t *p01 = px + ox1;
536 uint16_t *p10 = px + oy1;
537 uint16_t *p11 = p10 + ox1;
540 wdec14(*px, *p10, &i00, &i10);
541 wdec14(*p01, *p11, &i01, &i11);
542 wdec14(i00, i01, px, p01);
543 wdec14(i10, i11, p10, p11);
545 wdec16(*px, *p10, &i00, &i10);
546 wdec16(*p01, *p11, &i01, &i11);
547 wdec16(i00, i01, px, p01);
548 wdec16(i10, i11, p10, p11);
553 uint16_t *p10 = px + oy1;
556 wdec14(*px, *p10, &i00, p10);
558 wdec16(*px, *p10, &i00, p10);
566 uint16_t *ex = py + ox * (nx - p2);
568 for (; px <= ex; px += ox2) {
569 uint16_t *p01 = px + ox1;
572 wdec14(*px, *p01, &i00, p01);
574 wdec16(*px, *p01, &i00, p01);
585 static int piz_uncompress(EXRContext *s, const uint8_t *src, int ssize,
586 int dsize, EXRThreadData *td)
589 uint16_t maxval, min_non_zero, max_non_zero;
591 uint16_t *tmp = (uint16_t *)td->tmp;
595 int pixel_half_size;/* 1 for half, 2 for float and uint32 */
600 td->bitmap = av_malloc(BITMAP_SIZE);
602 td->lut = av_malloc(1 << 17);
603 if (!td->bitmap || !td->lut) {
604 av_freep(&td->bitmap);
606 return AVERROR(ENOMEM);
609 bytestream2_init(&gb, src, ssize);
610 min_non_zero = bytestream2_get_le16(&gb);
611 max_non_zero = bytestream2_get_le16(&gb);
613 if (max_non_zero >= BITMAP_SIZE)
614 return AVERROR_INVALIDDATA;
616 memset(td->bitmap, 0, FFMIN(min_non_zero, BITMAP_SIZE));
617 if (min_non_zero <= max_non_zero)
618 bytestream2_get_buffer(&gb, td->bitmap + min_non_zero,
619 max_non_zero - min_non_zero + 1);
620 memset(td->bitmap + max_non_zero + 1, 0, BITMAP_SIZE - max_non_zero - 1);
622 maxval = reverse_lut(td->bitmap, td->lut);
624 bytestream2_skip(&gb, 4);
625 ret = huf_uncompress(s, td, &gb, tmp, dsize / sizeof(uint16_t));
630 for (i = 0; i < s->nb_channels; i++) {
631 channel = &s->channels[i];
633 if (channel->pixel_type == EXR_HALF)
638 for (j = 0; j < pixel_half_size; j++)
639 wav_decode(ptr + j, td->xsize, pixel_half_size, td->ysize,
640 td->xsize * pixel_half_size, maxval);
641 ptr += td->xsize * td->ysize * pixel_half_size;
644 apply_lut(td->lut, tmp, dsize / sizeof(uint16_t));
646 out = (uint16_t *)td->uncompressed_data;
647 for (i = 0; i < td->ysize; i++) {
649 for (j = 0; j < s->nb_channels; j++) {
650 channel = &s->channels[j];
651 if (channel->pixel_type == EXR_HALF)
656 in = tmp + tmp_offset * td->xsize * td->ysize + i * td->xsize * pixel_half_size;
657 tmp_offset += pixel_half_size;
660 s->bbdsp.bswap16_buf(out, in, td->xsize * pixel_half_size);
662 memcpy(out, in, td->xsize * 2 * pixel_half_size);
664 out += td->xsize * pixel_half_size;
671 static int pxr24_uncompress(EXRContext *s, const uint8_t *src,
672 int compressed_size, int uncompressed_size,
675 unsigned long dest_len, expected_len = 0;
676 const uint8_t *in = td->tmp;
680 for (i = 0; i < s->nb_channels; i++) {
681 if (s->channels[i].pixel_type == EXR_FLOAT) {
682 expected_len += (td->xsize * td->ysize * 3);/* PRX 24 store float in 24 bit instead of 32 */
683 } else if (s->channels[i].pixel_type == EXR_HALF) {
684 expected_len += (td->xsize * td->ysize * 2);
686 expected_len += (td->xsize * td->ysize * 4);
690 dest_len = expected_len;
692 if (uncompress(td->tmp, &dest_len, src, compressed_size) != Z_OK) {
693 return AVERROR_INVALIDDATA;
694 } else if (dest_len != expected_len) {
695 return AVERROR_INVALIDDATA;
698 out = td->uncompressed_data;
699 for (i = 0; i < td->ysize; i++)
700 for (c = 0; c < s->nb_channels; c++) {
701 EXRChannel *channel = &s->channels[c];
702 const uint8_t *ptr[4];
705 switch (channel->pixel_type) {
708 ptr[1] = ptr[0] + td->xsize;
709 ptr[2] = ptr[1] + td->xsize;
710 in = ptr[2] + td->xsize;
712 for (j = 0; j < td->xsize; ++j) {
713 uint32_t diff = ((unsigned)*(ptr[0]++) << 24) |
714 (*(ptr[1]++) << 16) |
717 bytestream_put_le32(&out, pixel);
722 ptr[1] = ptr[0] + td->xsize;
723 in = ptr[1] + td->xsize;
724 for (j = 0; j < td->xsize; j++) {
725 uint32_t diff = (*(ptr[0]++) << 8) | *(ptr[1]++);
728 bytestream_put_le16(&out, pixel);
733 ptr[1] = ptr[0] + s->xdelta;
734 ptr[2] = ptr[1] + s->xdelta;
735 ptr[3] = ptr[2] + s->xdelta;
736 in = ptr[3] + s->xdelta;
738 for (j = 0; j < s->xdelta; ++j) {
739 uint32_t diff = ((uint32_t)*(ptr[0]++) << 24) |
740 (*(ptr[1]++) << 16) |
741 (*(ptr[2]++) << 8 ) |
744 bytestream_put_le32(&out, pixel);
748 return AVERROR_INVALIDDATA;
755 static void unpack_14(const uint8_t b[14], uint16_t s[16])
757 unsigned short shift = (b[ 2] >> 2) & 15;
758 unsigned short bias = (0x20 << shift);
761 s[ 0] = (b[0] << 8) | b[1];
763 s[ 4] = s[ 0] + ((((b[ 2] << 4) | (b[ 3] >> 4)) & 0x3f) << shift) - bias;
764 s[ 8] = s[ 4] + ((((b[ 3] << 2) | (b[ 4] >> 6)) & 0x3f) << shift) - bias;
765 s[12] = s[ 8] + ((b[ 4] & 0x3f) << shift) - bias;
767 s[ 1] = s[ 0] + ((b[ 5] >> 2) << shift) - bias;
768 s[ 5] = s[ 4] + ((((b[ 5] << 4) | (b[ 6] >> 4)) & 0x3f) << shift) - bias;
769 s[ 9] = s[ 8] + ((((b[ 6] << 2) | (b[ 7] >> 6)) & 0x3f) << shift) - bias;
770 s[13] = s[12] + ((b[ 7] & 0x3f) << shift) - bias;
772 s[ 2] = s[ 1] + ((b[ 8] >> 2) << shift) - bias;
773 s[ 6] = s[ 5] + ((((b[ 8] << 4) | (b[ 9] >> 4)) & 0x3f) << shift) - bias;
774 s[10] = s[ 9] + ((((b[ 9] << 2) | (b[10] >> 6)) & 0x3f) << shift) - bias;
775 s[14] = s[13] + ((b[10] & 0x3f) << shift) - bias;
777 s[ 3] = s[ 2] + ((b[11] >> 2) << shift) - bias;
778 s[ 7] = s[ 6] + ((((b[11] << 4) | (b[12] >> 4)) & 0x3f) << shift) - bias;
779 s[11] = s[10] + ((((b[12] << 2) | (b[13] >> 6)) & 0x3f) << shift) - bias;
780 s[15] = s[14] + ((b[13] & 0x3f) << shift) - bias;
782 for (i = 0; i < 16; ++i) {
790 static void unpack_3(const uint8_t b[3], uint16_t s[16])
794 s[0] = (b[0] << 8) | b[1];
801 for (i = 1; i < 16; i++)
806 static int b44_uncompress(EXRContext *s, const uint8_t *src, int compressed_size,
807 int uncompressed_size, EXRThreadData *td) {
808 const int8_t *sr = src;
809 int stay_to_uncompress = compressed_size;
810 int nb_b44_block_w, nb_b44_block_h;
811 int index_tl_x, index_tl_y, index_out, index_tmp;
812 uint16_t tmp_buffer[16]; /* B44 use 4x4 half float pixel */
814 int target_channel_offset = 0;
816 /* calc B44 block count */
817 nb_b44_block_w = td->xsize / 4;
818 if ((td->xsize % 4) != 0)
821 nb_b44_block_h = td->ysize / 4;
822 if ((td->ysize % 4) != 0)
825 for (c = 0; c < s->nb_channels; c++) {
826 if (s->channels[c].pixel_type == EXR_HALF) {/* B44 only compress half float data */
827 for (iY = 0; iY < nb_b44_block_h; iY++) {
828 for (iX = 0; iX < nb_b44_block_w; iX++) {/* For each B44 block */
829 if (stay_to_uncompress < 3) {
830 av_log(s, AV_LOG_ERROR, "Not enough data for B44A block: %d", stay_to_uncompress);
831 return AVERROR_INVALIDDATA;
834 if (src[compressed_size - stay_to_uncompress + 2] == 0xfc) { /* B44A block */
835 unpack_3(sr, tmp_buffer);
837 stay_to_uncompress -= 3;
838 } else {/* B44 Block */
839 if (stay_to_uncompress < 14) {
840 av_log(s, AV_LOG_ERROR, "Not enough data for B44 block: %d", stay_to_uncompress);
841 return AVERROR_INVALIDDATA;
843 unpack_14(sr, tmp_buffer);
845 stay_to_uncompress -= 14;
848 /* copy data to uncompress buffer (B44 block can exceed target resolution)*/
852 for (y = index_tl_y; y < FFMIN(index_tl_y + 4, td->ysize); y++) {
853 for (x = index_tl_x; x < FFMIN(index_tl_x + 4, td->xsize); x++) {
854 index_out = target_channel_offset * td->xsize + y * td->channel_line_size + 2 * x;
855 index_tmp = (y-index_tl_y) * 4 + (x-index_tl_x);
856 td->uncompressed_data[index_out] = tmp_buffer[index_tmp] & 0xff;
857 td->uncompressed_data[index_out + 1] = tmp_buffer[index_tmp] >> 8;
862 target_channel_offset += 2;
863 } else {/* Float or UINT 32 channel */
864 if (stay_to_uncompress < td->ysize * td->xsize * 4) {
865 av_log(s, AV_LOG_ERROR, "Not enough data for uncompress channel: %d", stay_to_uncompress);
866 return AVERROR_INVALIDDATA;
869 for (y = 0; y < td->ysize; y++) {
870 index_out = target_channel_offset * td->xsize + y * td->channel_line_size;
871 memcpy(&td->uncompressed_data[index_out], sr, td->xsize * 4);
874 target_channel_offset += 4;
876 stay_to_uncompress -= td->ysize * td->xsize * 4;
883 static int ac_uncompress(EXRContext *s, GetByteContext *gb, float *block)
888 uint16_t val = bytestream2_get_ne16(gb);
892 } else if ((val >> 8) == 0xff) {
896 block[ff_zigzag_direct[n]] = av_int2float(half2float(val,
907 static void idct_1d(float *blk, int step)
909 const float a = .5f * cosf( M_PI / 4.f);
910 const float b = .5f * cosf( M_PI / 16.f);
911 const float c = .5f * cosf( M_PI / 8.f);
912 const float d = .5f * cosf(3.f*M_PI / 16.f);
913 const float e = .5f * cosf(5.f*M_PI / 16.f);
914 const float f = .5f * cosf(3.f*M_PI / 8.f);
915 const float g = .5f * cosf(7.f*M_PI / 16.f);
917 float alpha[4], beta[4], theta[4], gamma[4];
919 alpha[0] = c * blk[2 * step];
920 alpha[1] = f * blk[2 * step];
921 alpha[2] = c * blk[6 * step];
922 alpha[3] = f * blk[6 * step];
924 beta[0] = b * blk[1 * step] + d * blk[3 * step] + e * blk[5 * step] + g * blk[7 * step];
925 beta[1] = d * blk[1 * step] - g * blk[3 * step] - b * blk[5 * step] - e * blk[7 * step];
926 beta[2] = e * blk[1 * step] - b * blk[3 * step] + g * blk[5 * step] + d * blk[7 * step];
927 beta[3] = g * blk[1 * step] - e * blk[3 * step] + d * blk[5 * step] - b * blk[7 * step];
929 theta[0] = a * (blk[0 * step] + blk[4 * step]);
930 theta[3] = a * (blk[0 * step] - blk[4 * step]);
932 theta[1] = alpha[0] + alpha[3];
933 theta[2] = alpha[1] - alpha[2];
935 gamma[0] = theta[0] + theta[1];
936 gamma[1] = theta[3] + theta[2];
937 gamma[2] = theta[3] - theta[2];
938 gamma[3] = theta[0] - theta[1];
940 blk[0 * step] = gamma[0] + beta[0];
941 blk[1 * step] = gamma[1] + beta[1];
942 blk[2 * step] = gamma[2] + beta[2];
943 blk[3 * step] = gamma[3] + beta[3];
945 blk[4 * step] = gamma[3] - beta[3];
946 blk[5 * step] = gamma[2] - beta[2];
947 blk[6 * step] = gamma[1] - beta[1];
948 blk[7 * step] = gamma[0] - beta[0];
951 static void dct_inverse(float *block)
953 for (int i = 0; i < 8; i++)
954 idct_1d(block + i, 8);
956 for (int i = 0; i < 8; i++) {
962 static void convert(float y, float u, float v,
963 float *b, float *g, float *r)
965 *r = y + 1.5747f * v;
966 *g = y - 0.1873f * u - 0.4682f * v;
967 *b = y + 1.8556f * u;
970 static float to_linear(float x, float scale)
975 return FFSIGN(x) * powf(ax, 2.2f * scale);
977 const float log_base = expf(2.2f * scale);
979 return FFSIGN(x) * powf(log_base, ax - 1.f);
983 static int dwa_uncompress(EXRContext *s, const uint8_t *src, int compressed_size,
984 int uncompressed_size, EXRThreadData *td)
986 int64_t version, lo_usize, lo_size;
987 int64_t ac_size, dc_size, rle_usize, rle_csize, rle_raw_size;
988 int64_t ac_count, dc_count, ac_compression;
989 const int dc_w = td->xsize >> 3;
990 const int dc_h = td->ysize >> 3;
991 GetByteContext gb, agb;
994 if (compressed_size <= 88)
995 return AVERROR_INVALIDDATA;
997 version = AV_RL64(src + 0);
999 return AVERROR_INVALIDDATA;
1001 lo_usize = AV_RL64(src + 8);
1002 lo_size = AV_RL64(src + 16);
1003 ac_size = AV_RL64(src + 24);
1004 dc_size = AV_RL64(src + 32);
1005 rle_csize = AV_RL64(src + 40);
1006 rle_usize = AV_RL64(src + 48);
1007 rle_raw_size = AV_RL64(src + 56);
1008 ac_count = AV_RL64(src + 64);
1009 dc_count = AV_RL64(src + 72);
1010 ac_compression = AV_RL64(src + 80);
1012 if (compressed_size < 88LL + lo_size + ac_size + dc_size + rle_csize)
1013 return AVERROR_INVALIDDATA;
1015 bytestream2_init(&gb, src + 88, compressed_size - 88);
1016 skip = bytestream2_get_le16(&gb);
1018 return AVERROR_INVALIDDATA;
1020 bytestream2_skip(&gb, skip - 2);
1023 if (lo_usize > uncompressed_size)
1024 return AVERROR_INVALIDDATA;
1025 bytestream2_skip(&gb, lo_size);
1029 unsigned long dest_len = ac_count * 2LL;
1030 GetByteContext agb = gb;
1032 if (ac_count > 3LL * td->xsize * s->scan_lines_per_block)
1033 return AVERROR_INVALIDDATA;
1035 av_fast_padded_malloc(&td->ac_data, &td->ac_size, dest_len);
1037 return AVERROR(ENOMEM);
1039 switch (ac_compression) {
1041 ret = huf_uncompress(s, td, &agb, (int16_t *)td->ac_data, ac_count);
1046 if (uncompress(td->ac_data, &dest_len, agb.buffer, ac_size) != Z_OK ||
1047 dest_len != ac_count * 2LL)
1048 return AVERROR_INVALIDDATA;
1051 return AVERROR_INVALIDDATA;
1054 bytestream2_skip(&gb, ac_size);
1058 unsigned long dest_len = dc_count * 2LL;
1059 GetByteContext agb = gb;
1061 if (dc_count > (6LL * td->xsize * td->ysize + 63) / 64)
1062 return AVERROR_INVALIDDATA;
1064 av_fast_padded_malloc(&td->dc_data, &td->dc_size, FFALIGN(dest_len, 64) * 2);
1066 return AVERROR(ENOMEM);
1068 if (uncompress(td->dc_data + FFALIGN(dest_len, 64), &dest_len, agb.buffer, dc_size) != Z_OK ||
1069 (dest_len != dc_count * 2LL))
1070 return AVERROR_INVALIDDATA;
1072 s->dsp.predictor(td->dc_data + FFALIGN(dest_len, 64), dest_len);
1073 s->dsp.reorder_pixels(td->dc_data, td->dc_data + FFALIGN(dest_len, 64), dest_len);
1075 bytestream2_skip(&gb, dc_size);
1078 if (rle_raw_size > 0 && rle_csize > 0 && rle_usize > 0) {
1079 unsigned long dest_len = rle_usize;
1081 av_fast_padded_malloc(&td->rle_data, &td->rle_size, rle_usize);
1083 return AVERROR(ENOMEM);
1085 av_fast_padded_malloc(&td->rle_raw_data, &td->rle_raw_size, rle_raw_size);
1086 if (!td->rle_raw_data)
1087 return AVERROR(ENOMEM);
1089 if (uncompress(td->rle_data, &dest_len, gb.buffer, rle_csize) != Z_OK ||
1090 (dest_len != rle_usize))
1091 return AVERROR_INVALIDDATA;
1093 ret = rle(td->rle_raw_data, td->rle_data, rle_usize, rle_raw_size);
1096 bytestream2_skip(&gb, rle_csize);
1099 bytestream2_init(&agb, td->ac_data, ac_count * 2);
1101 for (int y = 0; y < td->ysize; y += 8) {
1102 for (int x = 0; x < td->xsize; x += 8) {
1103 memset(td->block, 0, sizeof(td->block));
1105 for (int j = 0; j < 3; j++) {
1106 float *block = td->block[j];
1107 const int idx = (x >> 3) + (y >> 3) * dc_w + dc_w * dc_h * j;
1108 uint16_t *dc = (uint16_t *)td->dc_data;
1109 union av_intfloat32 dc_val;
1111 dc_val.i = half2float(dc[idx], s->mantissatable,
1112 s->exponenttable, s->offsettable);
1114 block[0] = dc_val.f;
1115 ac_uncompress(s, &agb, block);
1120 const float scale = s->pixel_type == EXR_FLOAT ? 2.f : 1.f;
1121 const int o = s->nb_channels == 4;
1122 float *bo = ((float *)td->uncompressed_data) +
1123 y * td->xsize * s->nb_channels + td->xsize * (o + 0) + x;
1124 float *go = ((float *)td->uncompressed_data) +
1125 y * td->xsize * s->nb_channels + td->xsize * (o + 1) + x;
1126 float *ro = ((float *)td->uncompressed_data) +
1127 y * td->xsize * s->nb_channels + td->xsize * (o + 2) + x;
1128 float *yb = td->block[0];
1129 float *ub = td->block[1];
1130 float *vb = td->block[2];
1132 for (int yy = 0; yy < 8; yy++) {
1133 for (int xx = 0; xx < 8; xx++) {
1134 const int idx = xx + yy * 8;
1136 convert(yb[idx], ub[idx], vb[idx], &bo[xx], &go[xx], &ro[xx]);
1138 bo[xx] = to_linear(bo[xx], scale);
1139 go[xx] = to_linear(go[xx], scale);
1140 ro[xx] = to_linear(ro[xx], scale);
1143 bo += td->xsize * s->nb_channels;
1144 go += td->xsize * s->nb_channels;
1145 ro += td->xsize * s->nb_channels;
1151 if (s->nb_channels < 4)
1154 for (int y = 0; y < td->ysize && td->rle_raw_data; y++) {
1155 uint32_t *ao = ((uint32_t *)td->uncompressed_data) + y * td->xsize * s->nb_channels;
1156 uint8_t *ai0 = td->rle_raw_data + y * td->xsize;
1157 uint8_t *ai1 = td->rle_raw_data + y * td->xsize + rle_raw_size / 2;
1159 for (int x = 0; x < td->xsize; x++) {
1160 uint16_t ha = ai0[x] | (ai1[x] << 8);
1162 ao[x] = half2float(ha, s->mantissatable, s->exponenttable, s->offsettable);
1169 static int decode_block(AVCodecContext *avctx, void *tdata,
1170 int jobnr, int threadnr)
1172 EXRContext *s = avctx->priv_data;
1173 AVFrame *const p = s->picture;
1174 EXRThreadData *td = &s->thread_data[threadnr];
1175 const uint8_t *channel_buffer[4] = { 0 };
1176 const uint8_t *buf = s->buf;
1177 uint64_t line_offset, uncompressed_size;
1181 uint64_t tile_x, tile_y, tile_level_x, tile_level_y;
1183 int step = s->desc->flags & AV_PIX_FMT_FLAG_FLOAT ? 4 : 2 * s->desc->nb_components;
1184 int bxmin = 0, axmax = 0, window_xoffset = 0;
1185 int window_xmin, window_xmax, window_ymin, window_ymax;
1186 int data_xoffset, data_yoffset, data_window_offset, xsize, ysize;
1187 int i, x, buf_size = s->buf_size;
1188 int c, rgb_channel_count;
1189 float one_gamma = 1.0f / s->gamma;
1190 avpriv_trc_function trc_func = avpriv_get_trc_function_from_trc(s->apply_trc_type);
1193 line_offset = AV_RL64(s->gb.buffer + jobnr * 8);
1196 if (buf_size < 20 || line_offset > buf_size - 20)
1197 return AVERROR_INVALIDDATA;
1199 src = buf + line_offset + 20;
1200 if (s->is_multipart)
1203 tile_x = AV_RL32(src - 20);
1204 tile_y = AV_RL32(src - 16);
1205 tile_level_x = AV_RL32(src - 12);
1206 tile_level_y = AV_RL32(src - 8);
1208 data_size = AV_RL32(src - 4);
1209 if (data_size <= 0 || data_size > buf_size - line_offset - 20)
1210 return AVERROR_INVALIDDATA;
1212 if (tile_level_x || tile_level_y) { /* tile level, is not the full res level */
1213 avpriv_report_missing_feature(s->avctx, "Subres tile before full res tile");
1214 return AVERROR_PATCHWELCOME;
1217 line = s->ymin + s->tile_attr.ySize * tile_y;
1218 col = s->tile_attr.xSize * tile_x;
1220 if (line < s->ymin || line > s->ymax ||
1221 s->xmin + col < s->xmin || s->xmin + col > s->xmax)
1222 return AVERROR_INVALIDDATA;
1224 td->ysize = FFMIN(s->tile_attr.ySize, s->ydelta - tile_y * s->tile_attr.ySize);
1225 td->xsize = FFMIN(s->tile_attr.xSize, s->xdelta - tile_x * s->tile_attr.xSize);
1227 if (td->xsize * (uint64_t)s->current_channel_offset > INT_MAX)
1228 return AVERROR_INVALIDDATA;
1230 td->channel_line_size = td->xsize * s->current_channel_offset;/* uncompress size of one line */
1231 uncompressed_size = td->channel_line_size * (uint64_t)td->ysize;/* uncompress size of the block */
1233 if (buf_size < 8 || line_offset > buf_size - 8)
1234 return AVERROR_INVALIDDATA;
1236 src = buf + line_offset + 8;
1237 if (s->is_multipart)
1239 line = AV_RL32(src - 8);
1241 if (line < s->ymin || line > s->ymax)
1242 return AVERROR_INVALIDDATA;
1244 data_size = AV_RL32(src - 4);
1245 if (data_size <= 0 || data_size > buf_size - line_offset - 8)
1246 return AVERROR_INVALIDDATA;
1248 td->ysize = FFMIN(s->scan_lines_per_block, s->ymax - line + 1); /* s->ydelta - line ?? */
1249 td->xsize = s->xdelta;
1251 if (td->xsize * (uint64_t)s->current_channel_offset > INT_MAX)
1252 return AVERROR_INVALIDDATA;
1254 td->channel_line_size = td->xsize * s->current_channel_offset;/* uncompress size of one line */
1255 uncompressed_size = td->channel_line_size * (uint64_t)td->ysize;/* uncompress size of the block */
1257 if ((s->compression == EXR_RAW && (data_size != uncompressed_size ||
1258 line_offset > buf_size - uncompressed_size)) ||
1259 (s->compression != EXR_RAW && (data_size > uncompressed_size ||
1260 line_offset > buf_size - data_size))) {
1261 return AVERROR_INVALIDDATA;
1265 window_xmin = FFMIN(avctx->width, FFMAX(0, s->xmin + col));
1266 window_xmax = FFMIN(avctx->width, FFMAX(0, s->xmin + col + td->xsize));
1267 window_ymin = FFMIN(avctx->height, FFMAX(0, line ));
1268 window_ymax = FFMIN(avctx->height, FFMAX(0, line + td->ysize));
1269 xsize = window_xmax - window_xmin;
1270 ysize = window_ymax - window_ymin;
1272 /* tile or scanline not visible skip decoding */
1273 if (xsize <= 0 || ysize <= 0)
1276 /* is the first tile or is a scanline */
1279 /* pixels to add at the left of the display window */
1280 window_xoffset = FFMAX(0, s->xmin);
1281 /* bytes to add at the left of the display window */
1282 bxmin = window_xoffset * step;
1285 /* is the last tile or is a scanline */
1286 if(col + td->xsize == s->xdelta) {
1287 window_xmax = avctx->width;
1288 /* bytes to add at the right of the display window */
1289 axmax = FFMAX(0, (avctx->width - (s->xmax + 1))) * step;
1292 if (data_size < uncompressed_size || s->is_tile) { /* td->tmp is use for tile reorganization */
1293 av_fast_padded_malloc(&td->tmp, &td->tmp_size, uncompressed_size);
1295 return AVERROR(ENOMEM);
1298 if (data_size < uncompressed_size) {
1299 av_fast_padded_malloc(&td->uncompressed_data,
1300 &td->uncompressed_size, uncompressed_size + 64);/* Force 64 padding for AVX2 reorder_pixels dst */
1302 if (!td->uncompressed_data)
1303 return AVERROR(ENOMEM);
1305 ret = AVERROR_INVALIDDATA;
1306 switch (s->compression) {
1309 ret = zip_uncompress(s, src, data_size, uncompressed_size, td);
1312 ret = piz_uncompress(s, src, data_size, uncompressed_size, td);
1315 ret = pxr24_uncompress(s, src, data_size, uncompressed_size, td);
1318 ret = rle_uncompress(s, src, data_size, uncompressed_size, td);
1322 ret = b44_uncompress(s, src, data_size, uncompressed_size, td);
1326 ret = dwa_uncompress(s, src, data_size, uncompressed_size, td);
1330 av_log(avctx, AV_LOG_ERROR, "decode_block() failed.\n");
1333 src = td->uncompressed_data;
1336 /* offsets to crop data outside display window */
1337 data_xoffset = FFABS(FFMIN(0, s->xmin + col)) * (s->pixel_type == EXR_HALF ? 2 : 4);
1338 data_yoffset = FFABS(FFMIN(0, line));
1339 data_window_offset = (data_yoffset * td->channel_line_size) + data_xoffset;
1342 channel_buffer[0] = src + (td->xsize * s->channel_offsets[0]) + data_window_offset;
1343 channel_buffer[1] = src + (td->xsize * s->channel_offsets[1]) + data_window_offset;
1344 channel_buffer[2] = src + (td->xsize * s->channel_offsets[2]) + data_window_offset;
1345 rgb_channel_count = 3;
1346 } else { /* put y data in the first channel_buffer */
1347 channel_buffer[0] = src + (td->xsize * s->channel_offsets[1]) + data_window_offset;
1348 rgb_channel_count = 1;
1350 if (s->channel_offsets[3] >= 0)
1351 channel_buffer[3] = src + (td->xsize * s->channel_offsets[3]) + data_window_offset;
1353 if (s->desc->flags & AV_PIX_FMT_FLAG_FLOAT) {
1354 /* todo: change this when a floating point pixel format with luma with alpha is implemented */
1355 int channel_count = s->channel_offsets[3] >= 0 ? 4 : rgb_channel_count;
1357 channel_buffer[1] = channel_buffer[0];
1358 channel_buffer[2] = channel_buffer[0];
1361 for (c = 0; c < channel_count; c++) {
1362 int plane = s->desc->comp[c].plane;
1363 ptr = p->data[plane] + window_ymin * p->linesize[plane] + (window_xmin * 4);
1365 for (i = 0; i < ysize; i++, ptr += p->linesize[plane]) {
1367 union av_intfloat32 *ptr_x;
1369 src = channel_buffer[c];
1370 ptr_x = (union av_intfloat32 *)ptr;
1372 // Zero out the start if xmin is not 0
1373 memset(ptr_x, 0, bxmin);
1374 ptr_x += window_xoffset;
1376 if (s->pixel_type == EXR_FLOAT ||
1377 s->compression == EXR_DWAA ||
1378 s->compression == EXR_DWAB) {
1380 union av_intfloat32 t;
1381 if (trc_func && c < 3) {
1382 for (x = 0; x < xsize; x++) {
1383 t.i = bytestream_get_le32(&src);
1384 t.f = trc_func(t.f);
1387 } else if (one_gamma != 1.f) {
1388 for (x = 0; x < xsize; x++) {
1389 t.i = bytestream_get_le32(&src);
1390 if (t.f > 0.0f && c < 3) /* avoid negative values */
1391 t.f = powf(t.f, one_gamma);
1395 for (x = 0; x < xsize; x++) {
1396 t.i = bytestream_get_le32(&src);
1400 } else if (s->pixel_type == EXR_HALF) {
1402 if (c < 3 || !trc_func) {
1403 for (x = 0; x < xsize; x++) {
1404 *ptr_x++ = s->gamma_table[bytestream_get_le16(&src)];
1407 for (x = 0; x < xsize; x++) {
1408 ptr_x[0].i = half2float(bytestream_get_le16(&src),
1417 // Zero out the end if xmax+1 is not w
1418 memset(ptr_x, 0, axmax);
1419 channel_buffer[c] += td->channel_line_size;
1424 av_assert1(s->pixel_type == EXR_UINT);
1425 ptr = p->data[0] + window_ymin * p->linesize[0] + (window_xmin * s->desc->nb_components * 2);
1427 for (i = 0; i < ysize; i++, ptr += p->linesize[0]) {
1430 const uint8_t *rgb[3];
1433 for (c = 0; c < rgb_channel_count; c++) {
1434 rgb[c] = channel_buffer[c];
1437 if (channel_buffer[3])
1438 a = channel_buffer[3];
1440 ptr_x = (uint16_t *) ptr;
1442 // Zero out the start if xmin is not 0
1443 memset(ptr_x, 0, bxmin);
1444 ptr_x += window_xoffset * s->desc->nb_components;
1446 for (x = 0; x < xsize; x++) {
1447 for (c = 0; c < rgb_channel_count; c++) {
1448 *ptr_x++ = bytestream_get_le32(&rgb[c]) >> 16;
1451 if (channel_buffer[3])
1452 *ptr_x++ = bytestream_get_le32(&a) >> 16;
1455 // Zero out the end if xmax+1 is not w
1456 memset(ptr_x, 0, axmax);
1458 channel_buffer[0] += td->channel_line_size;
1459 channel_buffer[1] += td->channel_line_size;
1460 channel_buffer[2] += td->channel_line_size;
1461 if (channel_buffer[3])
1462 channel_buffer[3] += td->channel_line_size;
1469 static void skip_header_chunk(EXRContext *s)
1471 GetByteContext *gb = &s->gb;
1473 while (bytestream2_get_bytes_left(gb) > 0) {
1474 if (!bytestream2_peek_byte(gb))
1477 // Process unknown variables
1478 for (int i = 0; i < 2; i++) // value_name and value_type
1479 while (bytestream2_get_byte(gb) != 0);
1481 // Skip variable length
1482 bytestream2_skip(gb, bytestream2_get_le32(gb));
1487 * Check if the variable name corresponds to its data type.
1489 * @param s the EXRContext
1490 * @param value_name name of the variable to check
1491 * @param value_type type of the variable to check
1492 * @param minimum_length minimum length of the variable data
1494 * @return bytes to read containing variable data
1495 * -1 if variable is not found
1496 * 0 if buffer ended prematurely
1498 static int check_header_variable(EXRContext *s,
1499 const char *value_name,
1500 const char *value_type,
1501 unsigned int minimum_length)
1503 GetByteContext *gb = &s->gb;
1506 if (bytestream2_get_bytes_left(gb) >= minimum_length &&
1507 !strcmp(gb->buffer, value_name)) {
1508 // found value_name, jump to value_type (null terminated strings)
1509 gb->buffer += strlen(value_name) + 1;
1510 if (!strcmp(gb->buffer, value_type)) {
1511 gb->buffer += strlen(value_type) + 1;
1512 var_size = bytestream2_get_le32(gb);
1513 // don't go read past boundaries
1514 if (var_size > bytestream2_get_bytes_left(gb))
1517 // value_type not found, reset the buffer
1518 gb->buffer -= strlen(value_name) + 1;
1519 av_log(s->avctx, AV_LOG_WARNING,
1520 "Unknown data type %s for header variable %s.\n",
1521 value_type, value_name);
1528 static int decode_header(EXRContext *s, AVFrame *frame)
1530 AVDictionary *metadata = NULL;
1531 GetByteContext *gb = &s->gb;
1532 int magic_number, version, flags;
1533 int layer_match = 0;
1535 int dup_channels = 0;
1537 s->current_channel_offset = 0;
1544 s->channel_offsets[0] = -1;
1545 s->channel_offsets[1] = -1;
1546 s->channel_offsets[2] = -1;
1547 s->channel_offsets[3] = -1;
1548 s->pixel_type = EXR_UNKNOWN;
1549 s->compression = EXR_UNKN;
1553 s->tile_attr.xSize = -1;
1554 s->tile_attr.ySize = -1;
1556 s->is_multipart = 0;
1558 s->current_part = 0;
1560 if (bytestream2_get_bytes_left(gb) < 10) {
1561 av_log(s->avctx, AV_LOG_ERROR, "Header too short to parse.\n");
1562 return AVERROR_INVALIDDATA;
1565 magic_number = bytestream2_get_le32(gb);
1566 if (magic_number != 20000630) {
1567 /* As per documentation of OpenEXR, it is supposed to be
1568 * int 20000630 little-endian */
1569 av_log(s->avctx, AV_LOG_ERROR, "Wrong magic number %d.\n", magic_number);
1570 return AVERROR_INVALIDDATA;
1573 version = bytestream2_get_byte(gb);
1575 avpriv_report_missing_feature(s->avctx, "Version %d", version);
1576 return AVERROR_PATCHWELCOME;
1579 flags = bytestream2_get_le24(gb);
1584 s->is_multipart = 1;
1586 avpriv_report_missing_feature(s->avctx, "deep data");
1587 return AVERROR_PATCHWELCOME;
1591 while (bytestream2_get_bytes_left(gb) > 0) {
1594 while (s->is_multipart && s->current_part < s->selected_part &&
1595 bytestream2_get_bytes_left(gb) > 0) {
1596 if (bytestream2_peek_byte(gb)) {
1597 skip_header_chunk(s);
1599 bytestream2_skip(gb, 1);
1600 if (!bytestream2_peek_byte(gb))
1603 bytestream2_skip(gb, 1);
1607 if (!bytestream2_peek_byte(gb)) {
1608 if (!s->is_multipart)
1610 bytestream2_skip(gb, 1);
1611 if (s->current_part == s->selected_part) {
1612 while (bytestream2_get_bytes_left(gb) > 0) {
1613 if (bytestream2_peek_byte(gb)) {
1614 skip_header_chunk(s);
1616 bytestream2_skip(gb, 1);
1617 if (!bytestream2_peek_byte(gb))
1622 if (!bytestream2_peek_byte(gb))
1627 if ((var_size = check_header_variable(s, "channels",
1628 "chlist", 38)) >= 0) {
1629 GetByteContext ch_gb;
1631 ret = AVERROR_INVALIDDATA;
1635 bytestream2_init(&ch_gb, gb->buffer, var_size);
1637 while (bytestream2_get_bytes_left(&ch_gb) >= 19) {
1638 EXRChannel *channel;
1639 enum ExrPixelType current_pixel_type;
1640 int channel_index = -1;
1643 if (strcmp(s->layer, "") != 0) {
1644 if (strncmp(ch_gb.buffer, s->layer, strlen(s->layer)) == 0) {
1646 av_log(s->avctx, AV_LOG_INFO,
1647 "Channel match layer : %s.\n", ch_gb.buffer);
1648 ch_gb.buffer += strlen(s->layer);
1649 if (*ch_gb.buffer == '.')
1650 ch_gb.buffer++; /* skip dot if not given */
1653 av_log(s->avctx, AV_LOG_INFO,
1654 "Channel doesn't match layer : %s.\n", ch_gb.buffer);
1660 if (layer_match) { /* only search channel if the layer match is valid */
1661 if (!av_strcasecmp(ch_gb.buffer, "R") ||
1662 !av_strcasecmp(ch_gb.buffer, "X") ||
1663 !av_strcasecmp(ch_gb.buffer, "U")) {
1666 } else if (!av_strcasecmp(ch_gb.buffer, "G") ||
1667 !av_strcasecmp(ch_gb.buffer, "V")) {
1670 } else if (!av_strcasecmp(ch_gb.buffer, "Y")) {
1673 } else if (!av_strcasecmp(ch_gb.buffer, "B") ||
1674 !av_strcasecmp(ch_gb.buffer, "Z") ||
1675 !av_strcasecmp(ch_gb.buffer, "W")) {
1678 } else if (!av_strcasecmp(ch_gb.buffer, "A")) {
1681 av_log(s->avctx, AV_LOG_WARNING,
1682 "Unsupported channel %.256s.\n", ch_gb.buffer);
1686 /* skip until you get a 0 */
1687 while (bytestream2_get_bytes_left(&ch_gb) > 0 &&
1688 bytestream2_get_byte(&ch_gb))
1691 if (bytestream2_get_bytes_left(&ch_gb) < 4) {
1692 av_log(s->avctx, AV_LOG_ERROR, "Incomplete header.\n");
1693 ret = AVERROR_INVALIDDATA;
1697 current_pixel_type = bytestream2_get_le32(&ch_gb);
1698 if (current_pixel_type >= EXR_UNKNOWN) {
1699 avpriv_report_missing_feature(s->avctx, "Pixel type %d",
1700 current_pixel_type);
1701 ret = AVERROR_PATCHWELCOME;
1705 bytestream2_skip(&ch_gb, 4);
1706 xsub = bytestream2_get_le32(&ch_gb);
1707 ysub = bytestream2_get_le32(&ch_gb);
1709 if (xsub != 1 || ysub != 1) {
1710 avpriv_report_missing_feature(s->avctx,
1711 "Subsampling %dx%d",
1713 ret = AVERROR_PATCHWELCOME;
1717 if (channel_index >= 0 && s->channel_offsets[channel_index] == -1) { /* channel has not been previously assigned */
1718 if (s->pixel_type != EXR_UNKNOWN &&
1719 s->pixel_type != current_pixel_type) {
1720 av_log(s->avctx, AV_LOG_ERROR,
1721 "RGB channels not of the same depth.\n");
1722 ret = AVERROR_INVALIDDATA;
1725 s->pixel_type = current_pixel_type;
1726 s->channel_offsets[channel_index] = s->current_channel_offset;
1727 } else if (channel_index >= 0) {
1728 av_log(s->avctx, AV_LOG_WARNING,
1729 "Multiple channels with index %d.\n", channel_index);
1730 if (++dup_channels > 10) {
1731 ret = AVERROR_INVALIDDATA;
1736 s->channels = av_realloc(s->channels,
1737 ++s->nb_channels * sizeof(EXRChannel));
1739 ret = AVERROR(ENOMEM);
1742 channel = &s->channels[s->nb_channels - 1];
1743 channel->pixel_type = current_pixel_type;
1744 channel->xsub = xsub;
1745 channel->ysub = ysub;
1747 if (current_pixel_type == EXR_HALF) {
1748 s->current_channel_offset += 2;
1749 } else {/* Float or UINT32 */
1750 s->current_channel_offset += 4;
1754 /* Check if all channels are set with an offset or if the channels
1755 * are causing an overflow */
1756 if (!s->is_luma) {/* if we expected to have at least 3 channels */
1757 if (FFMIN3(s->channel_offsets[0],
1758 s->channel_offsets[1],
1759 s->channel_offsets[2]) < 0) {
1760 if (s->channel_offsets[0] < 0)
1761 av_log(s->avctx, AV_LOG_ERROR, "Missing red channel.\n");
1762 if (s->channel_offsets[1] < 0)
1763 av_log(s->avctx, AV_LOG_ERROR, "Missing green channel.\n");
1764 if (s->channel_offsets[2] < 0)
1765 av_log(s->avctx, AV_LOG_ERROR, "Missing blue channel.\n");
1766 ret = AVERROR_INVALIDDATA;
1771 // skip one last byte and update main gb
1772 gb->buffer = ch_gb.buffer + 1;
1774 } else if ((var_size = check_header_variable(s, "dataWindow", "box2i",
1776 int xmin, ymin, xmax, ymax;
1778 ret = AVERROR_INVALIDDATA;
1782 xmin = bytestream2_get_le32(gb);
1783 ymin = bytestream2_get_le32(gb);
1784 xmax = bytestream2_get_le32(gb);
1785 ymax = bytestream2_get_le32(gb);
1787 if (xmin > xmax || ymin > ymax ||
1788 (unsigned)xmax - xmin >= INT_MAX ||
1789 (unsigned)ymax - ymin >= INT_MAX) {
1790 ret = AVERROR_INVALIDDATA;
1797 s->xdelta = (s->xmax - s->xmin) + 1;
1798 s->ydelta = (s->ymax - s->ymin) + 1;
1801 } else if ((var_size = check_header_variable(s, "displayWindow",
1802 "box2i", 34)) >= 0) {
1803 int32_t sx, sy, dx, dy;
1806 ret = AVERROR_INVALIDDATA;
1810 sx = bytestream2_get_le32(gb);
1811 sy = bytestream2_get_le32(gb);
1812 dx = bytestream2_get_le32(gb);
1813 dy = bytestream2_get_le32(gb);
1819 } else if ((var_size = check_header_variable(s, "lineOrder",
1820 "lineOrder", 25)) >= 0) {
1823 ret = AVERROR_INVALIDDATA;
1827 line_order = bytestream2_get_byte(gb);
1828 av_log(s->avctx, AV_LOG_DEBUG, "line order: %d.\n", line_order);
1829 if (line_order > 2) {
1830 av_log(s->avctx, AV_LOG_ERROR, "Unknown line order.\n");
1831 ret = AVERROR_INVALIDDATA;
1836 } else if ((var_size = check_header_variable(s, "pixelAspectRatio",
1837 "float", 31)) >= 0) {
1839 ret = AVERROR_INVALIDDATA;
1843 s->sar = bytestream2_get_le32(gb);
1846 } else if ((var_size = check_header_variable(s, "compression",
1847 "compression", 29)) >= 0) {
1849 ret = AVERROR_INVALIDDATA;
1853 if (s->compression == EXR_UNKN)
1854 s->compression = bytestream2_get_byte(gb);
1856 bytestream2_skip(gb, 1);
1857 av_log(s->avctx, AV_LOG_WARNING,
1858 "Found more than one compression attribute.\n");
1862 } else if ((var_size = check_header_variable(s, "tiles",
1863 "tiledesc", 22)) >= 0) {
1867 av_log(s->avctx, AV_LOG_WARNING,
1868 "Found tile attribute and scanline flags. Exr will be interpreted as scanline.\n");
1870 s->tile_attr.xSize = bytestream2_get_le32(gb);
1871 s->tile_attr.ySize = bytestream2_get_le32(gb);
1873 tileLevel = bytestream2_get_byte(gb);
1874 s->tile_attr.level_mode = tileLevel & 0x0f;
1875 s->tile_attr.level_round = (tileLevel >> 4) & 0x0f;
1877 if (s->tile_attr.level_mode >= EXR_TILE_LEVEL_UNKNOWN) {
1878 avpriv_report_missing_feature(s->avctx, "Tile level mode %d",
1879 s->tile_attr.level_mode);
1880 ret = AVERROR_PATCHWELCOME;
1884 if (s->tile_attr.level_round >= EXR_TILE_ROUND_UNKNOWN) {
1885 avpriv_report_missing_feature(s->avctx, "Tile level round %d",
1886 s->tile_attr.level_round);
1887 ret = AVERROR_PATCHWELCOME;
1892 } else if ((var_size = check_header_variable(s, "writer",
1893 "string", 1)) >= 0) {
1894 uint8_t key[256] = { 0 };
1896 bytestream2_get_buffer(gb, key, FFMIN(sizeof(key) - 1, var_size));
1897 av_dict_set(&metadata, "writer", key, 0);
1900 } else if ((var_size = check_header_variable(s, "framesPerSecond",
1901 "rational", 33)) >= 0) {
1903 ret = AVERROR_INVALIDDATA;
1907 s->avctx->framerate.num = bytestream2_get_le32(gb);
1908 s->avctx->framerate.den = bytestream2_get_le32(gb);
1911 } else if ((var_size = check_header_variable(s, "chunkCount",
1914 s->chunk_count = bytestream2_get_le32(gb);
1917 } else if ((var_size = check_header_variable(s, "type",
1918 "string", 16)) >= 0) {
1919 uint8_t key[256] = { 0 };
1921 bytestream2_get_buffer(gb, key, FFMIN(sizeof(key) - 1, var_size));
1922 if (strncmp("scanlineimage", key, var_size) &&
1923 strncmp("tiledimage", key, var_size))
1924 return AVERROR_PATCHWELCOME;
1927 } else if ((var_size = check_header_variable(s, "preview",
1928 "preview", 16)) >= 0) {
1929 uint32_t pw = bytestream2_get_le32(gb);
1930 uint32_t ph = bytestream2_get_le32(gb);
1931 int64_t psize = 4LL * pw * ph;
1933 if (psize >= bytestream2_get_bytes_left(gb))
1934 return AVERROR_INVALIDDATA;
1936 bytestream2_skip(gb, psize);
1941 // Check if there are enough bytes for a header
1942 if (bytestream2_get_bytes_left(gb) <= 9) {
1943 av_log(s->avctx, AV_LOG_ERROR, "Incomplete header\n");
1944 ret = AVERROR_INVALIDDATA;
1948 // Process unknown variables
1950 uint8_t name[256] = { 0 };
1951 uint8_t type[256] = { 0 };
1952 uint8_t value[256] = { 0 };
1955 while (bytestream2_get_bytes_left(gb) > 0 &&
1956 bytestream2_peek_byte(gb) && i < 255) {
1957 name[i++] = bytestream2_get_byte(gb);
1960 bytestream2_skip(gb, 1);
1962 while (bytestream2_get_bytes_left(gb) > 0 &&
1963 bytestream2_peek_byte(gb) && i < 255) {
1964 type[i++] = bytestream2_get_byte(gb);
1966 bytestream2_skip(gb, 1);
1967 size = bytestream2_get_le32(gb);
1969 bytestream2_get_buffer(gb, value, FFMIN(sizeof(value) - 1, size));
1970 if (!strcmp(type, "string"))
1971 av_dict_set(&metadata, name, value, 0);
1975 if (s->compression == EXR_UNKN) {
1976 av_log(s->avctx, AV_LOG_ERROR, "Missing compression attribute.\n");
1977 ret = AVERROR_INVALIDDATA;
1982 if (s->tile_attr.xSize < 1 || s->tile_attr.ySize < 1) {
1983 av_log(s->avctx, AV_LOG_ERROR, "Invalid tile attribute.\n");
1984 ret = AVERROR_INVALIDDATA;
1989 if (bytestream2_get_bytes_left(gb) <= 0) {
1990 av_log(s->avctx, AV_LOG_ERROR, "Incomplete frame.\n");
1991 ret = AVERROR_INVALIDDATA;
1995 frame->metadata = metadata;
1997 // aaand we are done
1998 bytestream2_skip(gb, 1);
2001 av_dict_free(&metadata);
2005 static int decode_frame(AVCodecContext *avctx, void *data,
2006 int *got_frame, AVPacket *avpkt)
2008 EXRContext *s = avctx->priv_data;
2009 GetByteContext *gb = &s->gb;
2010 ThreadFrame frame = { .f = data };
2011 AVFrame *picture = data;
2014 int i, y, ret, ymax;
2017 int nb_blocks; /* nb scanline or nb tile */
2018 uint64_t start_offset_table;
2019 uint64_t start_next_scanline;
2020 PutByteContext offset_table_writer;
2022 bytestream2_init(gb, avpkt->data, avpkt->size);
2024 if ((ret = decode_header(s, picture)) < 0)
2027 if ((s->compression == EXR_DWAA || s->compression == EXR_DWAB) &&
2028 s->pixel_type == EXR_HALF) {
2029 s->current_channel_offset *= 2;
2030 for (int i = 0; i < 4; i++)
2031 s->channel_offsets[i] *= 2;
2034 switch (s->pixel_type) {
2037 if (s->channel_offsets[3] >= 0) {
2039 avctx->pix_fmt = AV_PIX_FMT_GBRAPF32;
2041 /* todo: change this when a floating point pixel format with luma with alpha is implemented */
2042 avctx->pix_fmt = AV_PIX_FMT_GBRAPF32;
2046 avctx->pix_fmt = AV_PIX_FMT_GBRPF32;
2048 avctx->pix_fmt = AV_PIX_FMT_GRAYF32;
2053 if (s->channel_offsets[3] >= 0) {
2055 avctx->pix_fmt = AV_PIX_FMT_RGBA64;
2057 avctx->pix_fmt = AV_PIX_FMT_YA16;
2061 avctx->pix_fmt = AV_PIX_FMT_RGB48;
2063 avctx->pix_fmt = AV_PIX_FMT_GRAY16;
2068 av_log(avctx, AV_LOG_ERROR, "Missing channel list.\n");
2069 return AVERROR_INVALIDDATA;
2072 if (s->apply_trc_type != AVCOL_TRC_UNSPECIFIED)
2073 avctx->color_trc = s->apply_trc_type;
2075 switch (s->compression) {
2079 s->scan_lines_per_block = 1;
2083 s->scan_lines_per_block = 16;
2089 s->scan_lines_per_block = 32;
2092 s->scan_lines_per_block = 256;
2095 avpriv_report_missing_feature(avctx, "Compression %d", s->compression);
2096 return AVERROR_PATCHWELCOME;
2099 /* Verify the xmin, xmax, ymin and ymax before setting the actual image size.
2100 * It's possible for the data window can larger or outside the display window */
2101 if (s->xmin > s->xmax || s->ymin > s->ymax ||
2102 s->ydelta == 0xFFFFFFFF || s->xdelta == 0xFFFFFFFF) {
2103 av_log(avctx, AV_LOG_ERROR, "Wrong or missing size information.\n");
2104 return AVERROR_INVALIDDATA;
2107 if ((ret = ff_set_dimensions(avctx, s->w, s->h)) < 0)
2110 ff_set_sar(s->avctx, av_d2q(av_int2float(s->sar), 255));
2112 s->desc = av_pix_fmt_desc_get(avctx->pix_fmt);
2114 return AVERROR_INVALIDDATA;
2116 if (s->desc->flags & AV_PIX_FMT_FLAG_FLOAT) {
2117 planes = s->desc->nb_components;
2118 out_line_size = avctx->width * 4;
2121 out_line_size = avctx->width * 2 * s->desc->nb_components;
2125 nb_blocks = ((s->xdelta + s->tile_attr.xSize - 1) / s->tile_attr.xSize) *
2126 ((s->ydelta + s->tile_attr.ySize - 1) / s->tile_attr.ySize);
2127 } else { /* scanline */
2128 nb_blocks = (s->ydelta + s->scan_lines_per_block - 1) /
2129 s->scan_lines_per_block;
2132 if ((ret = ff_thread_get_buffer(avctx, &frame, 0)) < 0)
2135 if (bytestream2_get_bytes_left(gb)/8 < nb_blocks)
2136 return AVERROR_INVALIDDATA;
2138 // check offset table and recreate it if need
2139 if (!s->is_tile && bytestream2_peek_le64(gb) == 0) {
2140 av_log(s->avctx, AV_LOG_DEBUG, "recreating invalid scanline offset table\n");
2142 start_offset_table = bytestream2_tell(gb);
2143 start_next_scanline = start_offset_table + nb_blocks * 8;
2144 bytestream2_init_writer(&offset_table_writer, &avpkt->data[start_offset_table], nb_blocks * 8);
2146 for (y = 0; y < nb_blocks; y++) {
2147 /* write offset of prev scanline in offset table */
2148 bytestream2_put_le64(&offset_table_writer, start_next_scanline);
2150 /* get len of next scanline */
2151 bytestream2_seek(gb, start_next_scanline + 4, SEEK_SET);/* skip line number */
2152 start_next_scanline += (bytestream2_get_le32(gb) + 8);
2154 bytestream2_seek(gb, start_offset_table, SEEK_SET);
2157 // save pointer we are going to use in decode_block
2158 s->buf = avpkt->data;
2159 s->buf_size = avpkt->size;
2161 // Zero out the start if ymin is not 0
2162 for (i = 0; i < planes; i++) {
2163 ptr = picture->data[i];
2164 for (y = 0; y < FFMIN(s->ymin, s->h); y++) {
2165 memset(ptr, 0, out_line_size);
2166 ptr += picture->linesize[i];
2170 s->picture = picture;
2172 avctx->execute2(avctx, decode_block, s->thread_data, NULL, nb_blocks);
2174 ymax = FFMAX(0, s->ymax + 1);
2175 // Zero out the end if ymax+1 is not h
2176 if (ymax < avctx->height)
2177 for (i = 0; i < planes; i++) {
2178 ptr = picture->data[i] + (ymax * picture->linesize[i]);
2179 for (y = ymax; y < avctx->height; y++) {
2180 memset(ptr, 0, out_line_size);
2181 ptr += picture->linesize[i];
2185 picture->pict_type = AV_PICTURE_TYPE_I;
2191 static av_cold int decode_init(AVCodecContext *avctx)
2193 EXRContext *s = avctx->priv_data;
2195 union av_intfloat32 t;
2196 float one_gamma = 1.0f / s->gamma;
2197 avpriv_trc_function trc_func = NULL;
2199 half2float_table(s->mantissatable, s->exponenttable, s->offsettable);
2203 ff_exrdsp_init(&s->dsp);
2206 ff_bswapdsp_init(&s->bbdsp);
2209 trc_func = avpriv_get_trc_function_from_trc(s->apply_trc_type);
2211 for (i = 0; i < 65536; ++i) {
2212 t.i = half2float(i, s->mantissatable, s->exponenttable, s->offsettable);
2213 t.f = trc_func(t.f);
2214 s->gamma_table[i] = t;
2217 if (one_gamma > 0.9999f && one_gamma < 1.0001f) {
2218 for (i = 0; i < 65536; ++i) {
2219 s->gamma_table[i].i = half2float(i, s->mantissatable, s->exponenttable, s->offsettable);
2222 for (i = 0; i < 65536; ++i) {
2223 t.i = half2float(i, s->mantissatable, s->exponenttable, s->offsettable);
2224 /* If negative value we reuse half value */
2226 s->gamma_table[i] = t;
2228 t.f = powf(t.f, one_gamma);
2229 s->gamma_table[i] = t;
2235 // allocate thread data, used for non EXR_RAW compression types
2236 s->thread_data = av_mallocz_array(avctx->thread_count, sizeof(EXRThreadData));
2237 if (!s->thread_data)
2238 return AVERROR_INVALIDDATA;
2243 static av_cold int decode_end(AVCodecContext *avctx)
2245 EXRContext *s = avctx->priv_data;
2247 for (i = 0; i < avctx->thread_count; i++) {
2248 EXRThreadData *td = &s->thread_data[i];
2249 av_freep(&td->uncompressed_data);
2251 av_freep(&td->bitmap);
2254 av_freep(&td->freq);
2255 av_freep(&td->ac_data);
2256 av_freep(&td->dc_data);
2257 av_freep(&td->rle_data);
2258 av_freep(&td->rle_raw_data);
2259 ff_free_vlc(&td->vlc);
2262 av_freep(&s->thread_data);
2263 av_freep(&s->channels);
2268 #define OFFSET(x) offsetof(EXRContext, x)
2269 #define VD AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_DECODING_PARAM
2270 static const AVOption options[] = {
2271 { "layer", "Set the decoding layer", OFFSET(layer),
2272 AV_OPT_TYPE_STRING, { .str = "" }, 0, 0, VD },
2273 { "part", "Set the decoding part", OFFSET(selected_part),
2274 AV_OPT_TYPE_INT, { .i64 = 0 }, 0, INT_MAX, VD },
2275 { "gamma", "Set the float gamma value when decoding", OFFSET(gamma),
2276 AV_OPT_TYPE_FLOAT, { .dbl = 1.0f }, 0.001, FLT_MAX, VD },
2278 // XXX: Note the abuse of the enum using AVCOL_TRC_UNSPECIFIED to subsume the existing gamma option
2279 { "apply_trc", "color transfer characteristics to apply to EXR linear input", OFFSET(apply_trc_type),
2280 AV_OPT_TYPE_INT, {.i64 = AVCOL_TRC_UNSPECIFIED }, 1, AVCOL_TRC_NB-1, VD, "apply_trc_type"},
2281 { "bt709", "BT.709", 0,
2282 AV_OPT_TYPE_CONST, {.i64 = AVCOL_TRC_BT709 }, INT_MIN, INT_MAX, VD, "apply_trc_type"},
2283 { "gamma", "gamma", 0,
2284 AV_OPT_TYPE_CONST, {.i64 = AVCOL_TRC_UNSPECIFIED }, INT_MIN, INT_MAX, VD, "apply_trc_type"},
2285 { "gamma22", "BT.470 M", 0,
2286 AV_OPT_TYPE_CONST, {.i64 = AVCOL_TRC_GAMMA22 }, INT_MIN, INT_MAX, VD, "apply_trc_type"},
2287 { "gamma28", "BT.470 BG", 0,
2288 AV_OPT_TYPE_CONST, {.i64 = AVCOL_TRC_GAMMA28 }, INT_MIN, INT_MAX, VD, "apply_trc_type"},
2289 { "smpte170m", "SMPTE 170 M", 0,
2290 AV_OPT_TYPE_CONST, {.i64 = AVCOL_TRC_SMPTE170M }, INT_MIN, INT_MAX, VD, "apply_trc_type"},
2291 { "smpte240m", "SMPTE 240 M", 0,
2292 AV_OPT_TYPE_CONST, {.i64 = AVCOL_TRC_SMPTE240M }, INT_MIN, INT_MAX, VD, "apply_trc_type"},
2293 { "linear", "Linear", 0,
2294 AV_OPT_TYPE_CONST, {.i64 = AVCOL_TRC_LINEAR }, INT_MIN, INT_MAX, VD, "apply_trc_type"},
2296 AV_OPT_TYPE_CONST, {.i64 = AVCOL_TRC_LOG }, INT_MIN, INT_MAX, VD, "apply_trc_type"},
2297 { "log_sqrt", "Log square root", 0,
2298 AV_OPT_TYPE_CONST, {.i64 = AVCOL_TRC_LOG_SQRT }, INT_MIN, INT_MAX, VD, "apply_trc_type"},
2299 { "iec61966_2_4", "IEC 61966-2-4", 0,
2300 AV_OPT_TYPE_CONST, {.i64 = AVCOL_TRC_IEC61966_2_4 }, INT_MIN, INT_MAX, VD, "apply_trc_type"},
2301 { "bt1361", "BT.1361", 0,
2302 AV_OPT_TYPE_CONST, {.i64 = AVCOL_TRC_BT1361_ECG }, INT_MIN, INT_MAX, VD, "apply_trc_type"},
2303 { "iec61966_2_1", "IEC 61966-2-1", 0,
2304 AV_OPT_TYPE_CONST, {.i64 = AVCOL_TRC_IEC61966_2_1 }, INT_MIN, INT_MAX, VD, "apply_trc_type"},
2305 { "bt2020_10bit", "BT.2020 - 10 bit", 0,
2306 AV_OPT_TYPE_CONST, {.i64 = AVCOL_TRC_BT2020_10 }, INT_MIN, INT_MAX, VD, "apply_trc_type"},
2307 { "bt2020_12bit", "BT.2020 - 12 bit", 0,
2308 AV_OPT_TYPE_CONST, {.i64 = AVCOL_TRC_BT2020_12 }, INT_MIN, INT_MAX, VD, "apply_trc_type"},
2309 { "smpte2084", "SMPTE ST 2084", 0,
2310 AV_OPT_TYPE_CONST, {.i64 = AVCOL_TRC_SMPTEST2084 }, INT_MIN, INT_MAX, VD, "apply_trc_type"},
2311 { "smpte428_1", "SMPTE ST 428-1", 0,
2312 AV_OPT_TYPE_CONST, {.i64 = AVCOL_TRC_SMPTEST428_1 }, INT_MIN, INT_MAX, VD, "apply_trc_type"},
2317 static const AVClass exr_class = {
2318 .class_name = "EXR",
2319 .item_name = av_default_item_name,
2321 .version = LIBAVUTIL_VERSION_INT,
2324 AVCodec ff_exr_decoder = {
2326 .long_name = NULL_IF_CONFIG_SMALL("OpenEXR image"),
2327 .type = AVMEDIA_TYPE_VIDEO,
2328 .id = AV_CODEC_ID_EXR,
2329 .priv_data_size = sizeof(EXRContext),
2330 .init = decode_init,
2331 .close = decode_end,
2332 .decode = decode_frame,
2333 .capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_FRAME_THREADS |
2334 AV_CODEC_CAP_SLICE_THREADS,
2335 .priv_class = &exr_class,