3 * Copyright (c) 2000, 2001 Fabrice Bellard
4 * Copyright (c) 2003 Alex Beregszaszi
5 * Copyright (c) 2003-2004 Michael Niedermayer
7 * Support for external huffman table, various fixes (AVID workaround),
8 * aspecting, new decode_frame mechanism and apple mjpeg-b support
11 * This file is part of FFmpeg.
13 * FFmpeg is free software; you can redistribute it and/or
14 * modify it under the terms of the GNU Lesser General Public
15 * License as published by the Free Software Foundation; either
16 * version 2.1 of the License, or (at your option) any later version.
18 * FFmpeg is distributed in the hope that it will be useful,
19 * but WITHOUT ANY WARRANTY; without even the implied warranty of
20 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
21 * Lesser General Public License for more details.
23 * You should have received a copy of the GNU Lesser General Public
24 * License along with FFmpeg; if not, write to the Free Software
25 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
36 #include "libavutil/imgutils.h"
37 #include "libavutil/avassert.h"
42 #include "jpeglsdec.h"
/**
 * Build a VLC decoding table from a JPEG Huffman table description.
 *
 * Code lengths and code words are derived from bits_table/val_table by
 * ff_mjpeg_build_huffman_codes(); the table itself is created by
 * init_vlc_sparse() with 9 lookup bits and an explicit symbol array.
 *
 * @param vlc        table to initialise
 * @param bits_table forwarded to ff_mjpeg_build_huffman_codes()
 * @param val_table  forwarded to ff_mjpeg_build_huffman_codes()
 * @param nb_codes   number of codes handed to init_vlc_sparse(); asserted <= 256
 * @param use_static forwarded as the last argument of init_vlc_sparse()
 * @param is_ac      non-zero for AC tables (see the symbol mapping below)
 * @return the return value of init_vlc_sparse()
 *
 * NOTE(review): the declaration of i and the loop header that drives the
 * huff_sym[] fill are not visible in this extract.
 */
45 static int build_vlc(VLC *vlc, const uint8_t *bits_table, const uint8_t *val_table,
46 int nb_codes, int use_static, int is_ac)
48 uint8_t huff_size[256];
49 uint16_t huff_code[256];
50 uint16_t huff_sym[256];
53 assert(nb_codes <= 256);
/* unused entries keep length 0 */
55 memset(huff_size, 0, sizeof(huff_size));
56 ff_mjpeg_build_huffman_codes(huff_size, huff_code, bits_table, val_table);
/* symbol i decodes to i, offset by 16 when building an AC table */
59 huff_sym[i]= i + 16*is_ac;
/* AC symbol 0 gets the dedicated value 16*256; presumably this makes the
 * "code >> 4" run computation in the AC decoders overshoot the block so
 * that end-of-block terminates the loop -- TODO confirm against callers */
61 if(is_ac) huff_sym[0]= 16*256;
63 return init_vlc_sparse(vlc, 9, nb_codes, huff_size, 1, 1, huff_code, 2, 2, huff_sym, 2, 2, use_static);
/**
 * Fill s->vlcs[][] from the built-in ff_mjpeg_* default Huffman tables.
 *
 * vlcs[0][n] are built from the DC tables, vlcs[1][n] from the AC tables
 * with is_ac = 1 and vlcs[2][n] from the same AC tables with is_ac = 0;
 * n = 0 uses the luminance table, n = 1 the chrominance table.
 *
 * NOTE(review): the return value of every build_vlc() call is discarded,
 * so a failed table build is not reported from here.
 */
66 static void build_basic_mjpeg_vlc(MJpegDecodeContext * s) {
67 build_vlc(&s->vlcs[0][0], ff_mjpeg_bits_dc_luminance,
68 ff_mjpeg_val_dc, 12, 0, 0);
69 build_vlc(&s->vlcs[0][1], ff_mjpeg_bits_dc_chrominance,
70 ff_mjpeg_val_dc, 12, 0, 0);
71 build_vlc(&s->vlcs[1][0], ff_mjpeg_bits_ac_luminance,
72 ff_mjpeg_val_ac_luminance, 251, 0, 1);
73 build_vlc(&s->vlcs[1][1], ff_mjpeg_bits_ac_chrominance,
74 ff_mjpeg_val_ac_chrominance, 251, 0, 1);
/* second copy of the AC tables without the AC symbol remapping; the
 * progressive decoders in this file read vlcs[2][] */
75 build_vlc(&s->vlcs[2][0], ff_mjpeg_bits_ac_luminance,
76 ff_mjpeg_val_ac_luminance, 251, 0, 0);
77 build_vlc(&s->vlcs[2][1], ff_mjpeg_bits_ac_chrominance,
78 ff_mjpeg_val_ac_chrominance, 251, 0, 0);
/**
 * Codec init: prepare the MJpegDecodeContext stored in avctx->priv_data.
 *
 * Visible steps: point picture_ptr at the embedded frame, initialise the
 * DSP context and the zigzag scan table, remember the container's coded
 * height, build the default Huffman VLCs, optionally replace them with a
 * table read from extradata, and detect bottom-field-first material from a
 * QuickTime 'fiel' atom in extradata.
 *
 * NOTE(review): several lines (braces, remaining field initialisation, the
 * AMV branch body and the return statement) are not visible in this extract.
 */
81 av_cold int ff_mjpeg_decode_init(AVCodecContext *avctx)
83 MJpegDecodeContext *s = avctx->priv_data;
86 s->picture_ptr = &s->picture;
87 avcodec_get_frame_defaults(&s->picture);
90 dsputil_init(&s->dsp, avctx);
91 ff_init_scantable(s->dsp.idct_permutation, &s->scantable, ff_zigzag_direct);
/* kept so that ff_mjpeg_decode_sof() can compare it with the per-picture
 * height when testing for interlaced content */
96 s->org_height = avctx->coded_height;
97 avctx->chroma_sample_location = AVCHROMA_LOC_CENTER;
/* start from the built-in default tables */
99 build_basic_mjpeg_vlc(s);
/* optionally parse a Huffman table segment supplied as extradata; on
 * failure the default tables are rebuilt */
101 if (avctx->flags & CODEC_FLAG_EXTERN_HUFF)
103 av_log(avctx, AV_LOG_INFO, "mjpeg: using external huffman table\n");
104 init_get_bits(&s->gb, avctx->extradata, avctx->extradata_size*8);
105 if (ff_mjpeg_decode_dht(s)) {
106 av_log(avctx, AV_LOG_ERROR, "mjpeg: error using external huffman table, switching back to internal\n");
107 build_basic_mjpeg_vlc(s);
/* extradata bytes 4..7 == 'fiel' and byte 9 == 6 select bottom field first */
110 if (avctx->extradata_size > 9 &&
111 AV_RL32(avctx->extradata + 4) == MKTAG('f','i','e','l')) {
112 if (avctx->extradata[9] == 6) { /* quicktime icefloe 019 */
113 s->interlace_polarity = 1; /* bottom field first */
114 av_log(avctx, AV_LOG_DEBUG, "mjpeg bottom field first\n");
117 if (avctx->codec->id == CODEC_ID_AMV)
/**
 * Parse a quantization table segment from s->gb into s->quant_matrixes[]
 * and derive a rough per-table qscale estimate in s->qscale[].
 *
 * Only 8-bit precision tables are accepted (a non-zero precision nibble
 * triggers the "16bit precision" error).
 *
 * NOTE(review): the loops over the segment and over the 64 coefficients,
 * the validation of index and the return statements are not visible in
 * this extract.
 */
124 /* quantize tables */
125 int ff_mjpeg_decode_dqt(MJpegDecodeContext *s)
127 int len, index, i, j;
/* 16-bit segment length, minus the two bytes of the length field itself */
129 len = get_bits(&s->gb, 16) - 2;
132 /* only 8 bit precision handled */
133 if (get_bits(&s->gb, 4) != 0)
135 av_log(s->avctx, AV_LOG_ERROR, "dqt: 16bit precision\n");
/* low nibble selects the destination table */
138 index = get_bits(&s->gb, 4);
141 av_log(s->avctx, AV_LOG_DEBUG, "index=%d\n", index);
142 /* read quant table */
/* coefficient i of the stream is stored at its permuted scan position */
144 j = s->scantable.permutated[i];
145 s->quant_matrixes[index][j] = get_bits(&s->gb, 8);
148 //XXX FIXME finetune, and perhaps add dc too
/* qscale = half of the larger of the quantizers at scan positions 1 and 8 */
149 s->qscale[index]= FFMAX(
150 s->quant_matrixes[index][s->scantable.permutated[1]],
151 s->quant_matrixes[index][s->scantable.permutated[8]]) >> 1;
152 av_log(s->avctx, AV_LOG_DEBUG, "qscale[%d]: %d\n", index, s->qscale[index]);
/**
 * Parse a Huffman table segment from s->gb and (re)build the matching VLC
 * decoders in s->vlcs[class][index].
 *
 * For each table: a 4-bit class and a 4-bit index are read, followed by the
 * per-length code counts (bits_table) and the symbol values (val_table).
 * Any previous VLC in that slot is freed before the new one is built.
 * A second VLC is also built into s->vlcs[2][index] with is_ac = 0.
 *
 * NOTE(review): no range check on class and index is visible in this
 * extract, although both are 4-bit values used as indices into s->vlcs;
 * verify that the dropped lines validate them. The condition guarding the
 * vlcs[2][] rebuild is not visible either (presumably class > 0).
 */
159 /* decode huffman tables and build VLC decoders */
160 int ff_mjpeg_decode_dht(MJpegDecodeContext *s)
162 int len, index, i, class, n, v, code_max;
163 uint8_t bits_table[17];
164 uint8_t val_table[256];
/* 16-bit segment length, minus the two bytes of the length field itself */
166 len = get_bits(&s->gb, 16) - 2;
171 class = get_bits(&s->gb, 4);
174 index = get_bits(&s->gb, 4);
179 bits_table[i] = get_bits(&s->gb, 8);
/* n is the symbol count accumulated on lines not visible here; it must fit
 * both the remaining segment and val_table[256] */
183 if (len < n || n > 256)
188 v = get_bits(&s->gb, 8);
195 /* build VLC and flush previous vlc if present */
196 free_vlc(&s->vlcs[class][index]);
197 av_log(s->avctx, AV_LOG_DEBUG, "class=%d index=%d nb_codes=%d\n",
198 class, index, code_max + 1);
199 if(build_vlc(&s->vlcs[class][index], bits_table, val_table, code_max + 1, 0, class > 0) < 0){
/* same table again without the AC symbol remapping, for the progressive decoders */
204 free_vlc(&s->vlcs[2][index]);
205 if(build_vlc(&s->vlcs[2][index], bits_table, val_table, code_max + 1, 0, 0) < 0){
/**
 * Parse a start-of-frame header from s->gb.
 *
 * Reads sample precision, picture dimensions and the per-component
 * sampling factors and quantization table indices, (re)configures the
 * decoder when the dimensions change, selects the output pixel format,
 * obtains a frame buffer through avctx->get_buffer() and, in the last
 * section, allocates the coefficient storage (s->blocks / s->last_nnz).
 *
 * NOTE(review): many lines of this function (braces, returns, the switch on
 * pix_fmt_id, several conditions) are not visible in this extract.
 * Points that deserve a check against the full file:
 *  - no test that h_count[i] / v_count[i] are non-zero is visible, yet they
 *    feed divisions here (bw / bh) and in ff_mjpeg_decode_sos();
 *  - the results of av_mallocz() / av_malloc() for qscale_table, blocks[]
 *    and last_nnz[] are not checked in the visible lines;
 *  - pix_fmt_id reads h_count[0..3] / v_count[0..3] regardless of
 *    nb_components.
 */
213 int ff_mjpeg_decode_sof(MJpegDecodeContext *s)
215 int len, nb_components, i, width, height, pix_fmt_id;
217 /* XXX: verify len field validity */
218 len = get_bits(&s->gb, 16);
219 s->bits= get_bits(&s->gb, 8);
/* Pegasus RCT streams are forced to 9 bits; any other 9-bit stream sets rct */
221 if(s->pegasus_rct) s->bits=9;
222 if(s->bits==9 && !s->pegasus_rct) s->rct=1; //FIXME ugly
224 if (s->bits != 8 && !s->lossless){
225 av_log(s->avctx, AV_LOG_ERROR, "only 8 bits/component accepted\n");
/* height precedes width in the header */
229 height = get_bits(&s->gb, 16);
230 width = get_bits(&s->gb, 16);
232 //HACK for odd_height.mov
233 if(s->interlaced && s->width == width && s->height == height + 1)
236 av_log(s->avctx, AV_LOG_DEBUG, "sof0: picture: %dx%d\n", width, height);
237 if(av_image_check_size(width, height, 0, s->avctx))
240 nb_components = get_bits(&s->gb, 8);
241 if (nb_components <= 0 ||
242 nb_components > MAX_COMPONENTS)
244 if (s->ls && !(s->bits <= 8 || nb_components == 1)){
245 av_log(s->avctx, AV_LOG_ERROR, "only <= 8 bits/component or 16-bit gray accepted for JPEG-LS\n");
248 s->nb_components = nb_components;
/* per component: id byte (stored minus 1), 4-bit horizontal and vertical
 * sampling factors, quantization table index byte */
251 for(i=0;i<nb_components;i++) {
253 s->component_id[i] = get_bits(&s->gb, 8) - 1;
254 s->h_count[i] = get_bits(&s->gb, 4);
255 s->v_count[i] = get_bits(&s->gb, 4);
256 /* compute hmax and vmax (only used in interleaved case) */
257 if (s->h_count[i] > s->h_max)
258 s->h_max = s->h_count[i];
259 if (s->v_count[i] > s->v_max)
260 s->v_max = s->v_count[i];
261 s->quant_index[i] = get_bits(&s->gb, 8);
262 if (s->quant_index[i] >= 4)
264 av_log(s->avctx, AV_LOG_DEBUG, "component %d %d:%d id: %d quant:%d\n", i, s->h_count[i],
265 s->v_count[i], s->component_id[i], s->quant_index[i]);
268 if(s->ls && (s->h_max > 1 || s->v_max > 1)) {
269 av_log(s->avctx, AV_LOG_ERROR, "Subsampling in JPEG-LS is not supported.\n");
/* unsubsampled lossless streams are treated as RGB */
273 if(s->v_max==1 && s->h_max==1 && s->lossless==1) s->rgb=1;
275 /* if different size, realloc/alloc picture */
276 /* XXX: also check h_count and v_count */
277 if (width != s->width || height != s->height) {
278 av_freep(&s->qscale_table);
284 /* test interlaced mode */
/* a first picture shorter than 3/4 of the container height is taken to be
 * a single field */
285 if (s->first_picture &&
286 s->org_height != 0 &&
287 s->height < ((s->org_height * 3) / 4)) {
289 s->bottom_field = s->interlace_polarity;
290 s->picture_ptr->interlaced_frame = 1;
291 s->picture_ptr->top_field_first = !s->interlace_polarity;
295 avcodec_set_dimensions(s->avctx, width, height);
/* NOTE(review): allocation result not checked in the visible lines */
297 s->qscale_table= av_mallocz((s->width+15)/16);
299 s->first_picture = 0;
302 if(s->interlaced && (s->bottom_field == !s->interlace_polarity))
305 /* XXX: not complete test ! */
/* pack the sampling factors of four components into one word, one nibble
 * each: h0 v0 h1 v1 h2 v2 h3 v3 from the most significant nibble down */
306 pix_fmt_id = (s->h_count[0] << 28) | (s->v_count[0] << 24) |
307 (s->h_count[1] << 20) | (s->v_count[1] << 16) |
308 (s->h_count[2] << 12) | (s->v_count[2] << 8) |
309 (s->h_count[3] << 4) | s->v_count[3];
310 av_log(s->avctx, AV_LOG_DEBUG, "pix fmt id %x\n", pix_fmt_id);
311 //NOTE we do not allocate pictures large enough for the possible padding of h/v_count being 4
/* when every horizontal factor is 0 or 2, halve them all (2 -> 1) */
312 if(!(pix_fmt_id & 0xD0D0D0D0))
313 pix_fmt_id-= (pix_fmt_id & 0xF0F0F0F0)>>1;
/* likewise for the vertical factors */
314 if(!(pix_fmt_id & 0x0D0D0D0D))
315 pix_fmt_id-= (pix_fmt_id & 0x0F0F0F0F)>>1;
/* pixel format selection; the switch/case labels are not visible here */
320 s->avctx->pix_fmt = PIX_FMT_BGRA;
322 s->avctx->pix_fmt = s->cs_itu601 ? PIX_FMT_YUV444P : PIX_FMT_YUVJ444P;
323 assert(s->nb_components==3);
326 s->avctx->pix_fmt = PIX_FMT_GRAY8;
329 s->avctx->pix_fmt = s->cs_itu601 ? PIX_FMT_YUV440P : PIX_FMT_YUVJ440P;
332 s->avctx->pix_fmt = s->cs_itu601 ? PIX_FMT_YUV422P : PIX_FMT_YUVJ422P;
335 s->avctx->pix_fmt = s->cs_itu601 ? PIX_FMT_YUV420P : PIX_FMT_YUVJ420P;
338 av_log(s->avctx, AV_LOG_ERROR, "Unhandled pixel format 0x%x\n", pix_fmt_id);
/* presumably the JPEG-LS override of the format chosen above (the guarding
 * condition is not visible) -- TODO confirm */
342 if(s->nb_components > 1)
343 s->avctx->pix_fmt = PIX_FMT_RGB24;
344 else if(s->bits <= 8)
345 s->avctx->pix_fmt = PIX_FMT_GRAY8;
347 s->avctx->pix_fmt = PIX_FMT_GRAY16;
/* hand back the previous buffer before requesting a new one */
350 if(s->picture_ptr->data[0])
351 s->avctx->release_buffer(s->avctx, s->picture_ptr);
353 if(s->avctx->get_buffer(s->avctx, s->picture_ptr) < 0){
354 av_log(s->avctx, AV_LOG_ERROR, "get_buffer() failed\n");
357 s->picture_ptr->pict_type= AV_PICTURE_TYPE_I;
358 s->picture_ptr->key_frame= 1;
/* line stride is doubled for interlaced content so each field addresses
 * every second line */
362 s->linesize[i]= s->picture_ptr->linesize[i] << s->interlaced;
365 // printf("%d %d %d %d %d %d\n", s->width, s->height, s->linesize[0], s->linesize[1], s->interlaced, s->avctx->height);
/* expected length: 8 header bytes plus 3 bytes per component; a mismatch is
 * only logged at debug level in the visible lines */
367 if (len != (8+(3*nb_components)))
369 av_log(s->avctx, AV_LOG_DEBUG, "decode_sof0: error, len(%d) mismatch\n", len);
372 /* totally blank picture as progressive JPEG will only add details to it */
/* bw x bh = number of MCUs, rounding the picture up to whole MCUs */
374 int bw = (width + s->h_max*8-1) / (s->h_max*8);
375 int bh = (height + s->v_max*8-1) / (s->v_max*8);
376 for(i=0; i<s->nb_components; i++) {
377 int size = bw * bh * s->h_count[i] * s->v_count[i];
378 av_freep(&s->blocks[i]);
379 av_freep(&s->last_nnz[i]);
/* NOTE(review): neither allocation is checked in the visible lines */
380 s->blocks[i] = av_malloc(size * sizeof(**s->blocks));
381 s->last_nnz[i] = av_mallocz(size * sizeof(**s->last_nnz));
382 s->block_stride[i] = bw * s->h_count[i];
384 memset(s->coefs_finished, 0, sizeof(s->coefs_finished));
/**
 * Decode one DC difference: a VLC from s->vlcs[0][dc_index] gives the
 * magnitude category, then get_xbits() reads that many bits as the signed
 * value.
 *
 * NOTE(review): the failure check and the values returned for a bad VLC or
 * a zero category are not visible in this extract; callers in this file
 * log "error dc" for some return value.
 */
389 static inline int mjpeg_decode_dc(MJpegDecodeContext *s, int dc_index)
392 code = get_vlc2(&s->gb, s->vlcs[0][dc_index].table, 9, 2);
395 av_log(s->avctx, AV_LOG_WARNING, "mjpeg_decode_dc: bad vlc: %d:%d (%p)\n", 0, dc_index,
396 &s->vlcs[0][dc_index]);
401 return get_xbits(&s->gb, code);
/**
 * Decode one baseline 8x8 block into block[], dequantizing on the fly.
 *
 * The DC coefficient is predicted from s->last_dc[component]; the AC
 * coefficients are read with s->vlcs[1][ac_index] and written at their
 * permuted scan positions multiplied by quant_matrix[].
 *
 * NOTE(review): the AC loop header, the masking of code and the return
 * statements are not visible in this extract.
 */
406 /* decode block and dequantize */
407 static int decode_block(MJpegDecodeContext *s, DCTELEM *block,
408 int component, int dc_index, int ac_index, int16_t *quant_matrix)
410 int code, i, j, level, val;
413 val = mjpeg_decode_dc(s, dc_index);
415 av_log(s->avctx, AV_LOG_ERROR, "error dc\n");
/* DC is coded as a difference to the previous block of the same component */
418 val = val * quant_matrix[0] + s->last_dc[component];
419 s->last_dc[component] = val;
423 {OPEN_READER(re, &s->gb);
425 UPDATE_CACHE(re, &s->gb);
426 GET_VLC(code, re, &s->gb, s->vlcs[1][ac_index].table, 9, 2);
/* upper bits of the decoded symbol advance the coefficient index */
428 i += ((unsigned)code) >> 4;
/* refill the bit cache when the magnitude bits might not fit any more */
431 if(code > MIN_CACHE_BITS - 16){
432 UPDATE_CACHE(re, &s->gb);
/* read `code` bits as a signed value: sign is all-ones when the leading
 * cache bit is 0, which turns the raw bits into a negative level */
435 int cache=GET_CACHE(re,&s->gb);
436 int sign=(~cache)>>31;
437 level = (NEG_USR32(sign ^ cache,code) ^ sign) - sign;
440 LAST_SKIP_BITS(re, &s->gb, code);
443 av_log(s->avctx, AV_LOG_ERROR, "error count: %d\n", i);
446 j = s->scantable.permutated[i];
447 block[j] = level * quant_matrix[j];
450 CLOSE_READER(re, &s->gb);}
/**
 * Decode the DC coefficient of a block in a progressive first DC scan.
 *
 * The block is cleared, the DC difference is dequantized, shifted left by
 * Al and added to the running predictor s->last_dc[component].
 *
 * NOTE(review): the store into block[0] and the return statements are not
 * visible in this extract.
 */
455 static int decode_dc_progressive(MJpegDecodeContext *s, DCTELEM *block, int component,
456 int dc_index, int16_t *quant_matrix, int Al)
459 s->dsp.clear_block(block);
460 val = mjpeg_decode_dc(s, dc_index);
462 av_log(s->avctx, AV_LOG_ERROR, "error dc\n");
/* "*" binds tighter than "<<": (val * quant_matrix[0]) << Al */
465 val = (val * quant_matrix[0] << Al) + s->last_dc[component];
466 s->last_dc[component] = val;
/**
 * Decode the coefficients ss..se of one block in a progressive first AC
 * scan, using s->vlcs[2][ac_index].
 *
 * Decoded levels are dequantized, shifted left by Al and stored at their
 * permuted scan positions. Symbols with run == 0xF and no magnitude skip
 * ahead (ZRL); other zero-magnitude symbols read `run` extra bits into val,
 * presumably the end-of-band run kept in *EOBRUN -- TODO confirm, the
 * assignment is not visible.
 *
 * NOTE(review): loop headers, the handling of *EOBRUN and last_nnz and the
 * return statements are not visible in this extract.
 */
471 /* decode block and dequantize - progressive JPEG version */
472 static int decode_block_progressive(MJpegDecodeContext *s, DCTELEM *block, uint8_t *last_nnz,
473 int ac_index, int16_t *quant_matrix,
474 int ss, int se, int Al, int *EOBRUN)
476 int code, i, j, level, val, run;
482 {OPEN_READER(re, &s->gb);
484 UPDATE_CACHE(re, &s->gb);
485 GET_VLC(code, re, &s->gb, s->vlcs[2][ac_index].table, 9, 2);
/* high nibble of the symbol is the zero run */
487 run = ((unsigned) code) >> 4;
491 if(code > MIN_CACHE_BITS - 16){
492 UPDATE_CACHE(re, &s->gb);
/* read `code` bits as a signed value (same scheme as decode_block()) */
495 int cache=GET_CACHE(re,&s->gb);
496 int sign=(~cache)>>31;
497 level = (NEG_USR32(sign ^ cache,code) ^ sign) - sign;
500 LAST_SKIP_BITS(re, &s->gb, code);
/* two store sites: one at the last position of the band (se), one at the
 * running index i; the conditions choosing between them are not visible */
504 j = s->scantable.permutated[se];
505 block[j] = level * quant_matrix[j] << Al;
508 av_log(s->avctx, AV_LOG_ERROR, "error count: %d\n", i);
511 j = s->scantable.permutated[i];
512 block[j] = level * quant_matrix[j] << Al;
514 if(run == 0xF){// ZRL - skip 15 coefficients
517 av_log(s->avctx, AV_LOG_ERROR, "ZRL overflow: %d\n", i);
/* add `run` extra bits from the stream to val */
523 UPDATE_CACHE(re, &s->gb);
524 val += NEG_USR32(GET_CACHE(re, &s->gb), run);
525 LAST_SKIP_BITS(re, &s->gb, run);
532 CLOSE_READER(re, &s->gb);}
/*
 * REFINE_BIT(j): read one bit from the stream and, when it is 1, add
 * quant_matrix[j] << Al to block[j] with the sign of block[j]
 * ((q ^ sign) - sign yields q for sign == 0 and -q for sign == -1; this
 * assumes block[j] >> 15 produces 0 or -1, i.e. a 16-bit DCTELEM -- TODO
 * confirm). Relies on re, s, block, quant_matrix, sign and Al being in
 * scope at the expansion site.
 *
 * NOTE(review): the end of REFINE_BIT and the "#define" line of the macro
 * that the last two continuation lines belong to are not visible in this
 * extract.
 */
538 #define REFINE_BIT(j) {\
539 UPDATE_CACHE(re, &s->gb);\
540 sign = block[j]>>15;\
541 block[j] += SHOW_UBITS(re, &s->gb, 1) * ((quant_matrix[j]^sign)-sign) << Al;\
542 LAST_SKIP_BITS(re, &s->gb, 1);\
550 av_log(s->avctx, AV_LOG_ERROR, "error count: %d\n", i);\
555 j = s->scantable.permutated[i];\
/**
 * Decode the coefficients ss..se of one block in a progressive AC
 * refinement scan, using s->vlcs[2][ac_index].
 *
 * `last` bounds the part of the band that can already hold non-zero
 * coefficients (min of se and *last_nnz). A newly significant coefficient
 * is stored as +/- quant_matrix[j] << Al depending on one sign bit read
 * from the stream.
 *
 * NOTE(review): the loop structure, the uses of the refinement macros, the
 * *EOBRUN / *last_nnz updates and the return statements are not visible in
 * this extract.
 */
562 /* decode block and dequantize - progressive JPEG refinement pass */
563 static int decode_block_refinement(MJpegDecodeContext *s, DCTELEM *block, uint8_t *last_nnz,
564 int ac_index, int16_t *quant_matrix,
565 int ss, int se, int Al, int *EOBRUN)
567 int code, i=ss, j, sign, val, run;
568 int last = FFMIN(se, *last_nnz);
570 OPEN_READER(re, &s->gb);
575 UPDATE_CACHE(re, &s->gb);
576 GET_VLC(code, re, &s->gb, s->vlcs[2][ac_index].table, 9, 2);
579 run = ((unsigned) code) >> 4;
/* one bit follows the symbol; it is combined with quant_matrix[j] below as
 * (q ^ val) - val */
580 UPDATE_CACHE(re, &s->gb);
581 val = SHOW_UBITS(re, &s->gb, 1);
582 LAST_SKIP_BITS(re, &s->gb, 1);
584 j = s->scantable.permutated[i];
586 block[j] = ((quant_matrix[j]^val)-val) << Al;
590 CLOSE_READER(re, &s->gb);
594 run = ((unsigned) code) >> 4;
/* extend run with `val` extra bits from the stream */
601 UPDATE_CACHE(re, &s->gb);
602 run += SHOW_UBITS(re, &s->gb, val);
603 LAST_SKIP_BITS(re, &s->gb, val);
616 j = s->scantable.permutated[i];
620 CLOSE_READER(re, &s->gb);
/**
 * Decode a lossless JPEG scan of an RGB picture, one line at a time.
 *
 * Each line is first decoded into s->ljpeg_buffer (up to four 16-bit
 * samples per pixel) using spatial prediction, then written to
 * s->picture.data[0] as 4 bytes per pixel. Three output paths are visible:
 * one subtracting 0x200 before the >>2 (its guard is not visible,
 * presumably s->rct), one for s->pegasus_rct, and a plain copy with the
 * channel order reversed.
 *
 * @param predictor       predictor selector handed to PREDICT(); the first
 *                        line always uses predictor 1
 * @param point_transform left shift applied to every decoded difference
 *
 * NOTE(review): the result of av_fast_malloc() is not checked in the
 * visible lines; s->ljpeg_buffer may be NULL when buffer[0][i] is written.
 * Loop headers over i and the return statement are not visible in this
 * extract.
 */
627 static int ljpeg_decode_rgb_scan(MJpegDecodeContext *s, int predictor, int point_transform){
629 uint16_t (*buffer)[4];
630 int left[3], top[3], topleft[3];
631 const int linesize= s->linesize[0];
632 const int mask= (1<<s->bits)-1;
/* one buffer row: mb_width entries of four samples */
634 av_fast_malloc(&s->ljpeg_buffer, &s->ljpeg_buffer_size, (unsigned)s->mb_width * 4 * sizeof(s->ljpeg_buffer[0][0]));
635 buffer= s->ljpeg_buffer;
/* initial predictor value: half of the (point-transformed) sample range */
638 buffer[0][i]= 1 << (s->bits + point_transform - 1);
640 for(mb_y = 0; mb_y < s->mb_height; mb_y++) {
641 const int modified_predictor= mb_y ? predictor : 1;
642 uint8_t *ptr = s->picture.data[0] + (linesize * mb_y);
/* linesize was doubled for interlaced content, so half of it is one
 * picture line: the bottom field starts one line further down */
644 if (s->interlaced && s->bottom_field)
645 ptr += linesize >> 1;
648 top[i]= left[i]= topleft[i]= buffer[0][i];
650 for(mb_x = 0; mb_x < s->mb_width; mb_x++) {
651 if (s->restart_interval && !s->restart_count)
652 s->restart_count = s->restart_interval;
/* buffer[] still holds the previous line here, i.e. the "top" neighbour */
658 top[i]= buffer[mb_x][i];
660 PREDICT(pred, topleft[i], top[i], left[i], modified_predictor);
663 buffer[mb_x][i]= mask & (pred + (mjpeg_decode_dc(s, s->dc_index[i]) << point_transform));
666 if (s->restart_interval && !--s->restart_count) {
667 align_get_bits(&s->gb);
668 skip_bits(&s->gb, 16); /* skip RSTn */
673 for(mb_x = 0; mb_x < s->mb_width; mb_x++) {
674 ptr[4*mb_x+1] = buffer[mb_x][0] - ((buffer[mb_x][1] + buffer[mb_x][2] - 0x200)>>2);
675 ptr[4*mb_x+0] = buffer[mb_x][1] + ptr[4*mb_x+1];
676 ptr[4*mb_x+2] = buffer[mb_x][2] + ptr[4*mb_x+1];
678 }else if(s->pegasus_rct){
679 for(mb_x = 0; mb_x < s->mb_width; mb_x++) {
680 ptr[4*mb_x+1] = buffer[mb_x][0] - ((buffer[mb_x][1] + buffer[mb_x][2])>>2);
681 ptr[4*mb_x+0] = buffer[mb_x][1] + ptr[4*mb_x+1];
682 ptr[4*mb_x+2] = buffer[mb_x][2] + ptr[4*mb_x+1];
/* no colour transform: copy the three samples in reverse order */
685 for(mb_x = 0; mb_x < s->mb_width; mb_x++) {
686 ptr[4*mb_x+0] = buffer[mb_x][2];
687 ptr[4*mb_x+1] = buffer[mb_x][1];
688 ptr[4*mb_x+2] = buffer[mb_x][0];
/**
 * Decode a lossless JPEG scan of a three-component planar picture.
 *
 * Samples are predicted directly from their neighbours in
 * s->picture.data[c] and written in place. Samples on the first row or
 * column (and every sample of interlaced content) take the first branch,
 * which has dedicated predictors for the picture edges; all others use
 * PREDICT() with the stream's predictor.
 *
 * @param predictor       predictor selector handed to PREDICT()
 * @param point_transform left shift applied to every decoded difference
 *
 * NOTE(review): the loops over the blocks of a component, the assignments
 * of h, v, x, y and n, the edge conditions and the return statement are not
 * visible in this extract.
 */
695 static int ljpeg_decode_yuv_scan(MJpegDecodeContext *s, int predictor, int point_transform){
697 const int nb_components=3;
699 for(mb_y = 0; mb_y < s->mb_height; mb_y++) {
700 for(mb_x = 0; mb_x < s->mb_width; mb_x++) {
701 if (s->restart_interval && !s->restart_count)
702 s->restart_count = s->restart_interval;
/* edge-aware path */
704 if(mb_x==0 || mb_y==0 || s->interlaced){
705 for(i=0;i<nb_components;i++) {
707 int n, h, v, x, y, c, j, linesize;
709 c = s->comp_index[i];
714 linesize= s->linesize[c];
719 ptr = s->picture.data[c] + (linesize * (v * mb_y + y)) + (h * mb_x + x); //FIXME optimize this crap
/* no neighbours available: start from mid-grey */
722 pred= 128 << point_transform;
/* predict from the sample above */
728 pred= ptr[-linesize];
730 PREDICT(pred, ptr[-linesize-1], ptr[-linesize], ptr[-1], predictor);
/* bottom field: move down by one picture line (linesize is doubled when
 * interlaced) */
734 if (s->interlaced && s->bottom_field)
735 ptr += linesize >> 1;
736 *ptr= pred + (mjpeg_decode_dc(s, s->dc_index[i]) << point_transform);
/* interior path: all three neighbours exist */
745 for(i=0;i<nb_components;i++) {
747 int n, h, v, x, y, c, j, linesize;
749 c = s->comp_index[i];
754 linesize= s->linesize[c];
759 ptr = s->picture.data[c] + (linesize * (v * mb_y + y)) + (h * mb_x + x); //FIXME optimize this crap
760 PREDICT(pred, ptr[-linesize-1], ptr[-linesize], ptr[-1], predictor);
761 *ptr= pred + (mjpeg_decode_dc(s, s->dc_index[i]) << point_transform);
769 if (s->restart_interval && !--s->restart_count) {
770 align_get_bits(&s->gb);
771 skip_bits(&s->gb, 16); /* skip RSTn */
/**
 * Copy one block from src to dst, both using stride linesize.
 *
 * The block size depends on lowres: 8x8 for 0, 4x4 for 1, 2x2 for 2.
 *
 * NOTE(review): the switch header, the break statements and any further
 * cases are not visible in this extract.
 */
778 static av_always_inline void mjpeg_copy_block(uint8_t *dst, const uint8_t *src,
779 int linesize, int lowres)
782 case 0: copy_block8(dst, src, linesize, linesize, 8);
784 case 1: copy_block4(dst, src, linesize, linesize, 4);
786 case 2: copy_block2(dst, src, linesize, linesize, 2);
/**
 * Decode one DCT scan (baseline, or the DC part of a progressive picture)
 * MCU by MCU.
 *
 * @param nb_components number of components in this scan
 * @param Ah            passed in from the scan header's Ah field; its
 *                      visible use is limited to lines dropped from this
 *                      extract
 * @param Al            left shift applied to progressive DC values
 * @param mb_bitmask    optional bitmap with one bit per MCU; a 0 bit makes
 *                      copy_mb true for that MCU
 * @param reference     optional frame whose planes are used as the source
 *                      for mjpeg_copy_block()
 *
 * NOTE(review): many lines (braces, the block loop, the flipped-picture
 * condition, the progressive DC refinement condition, restart handling
 * details and the return statements) are not visible in this extract.
 */
793 static int mjpeg_decode_scan(MJpegDecodeContext *s, int nb_components, int Ah, int Al,
794 const uint8_t *mb_bitmask, const AVFrame *reference){
796 uint8_t* data[MAX_COMPONENTS];
797 const uint8_t *reference_data[MAX_COMPONENTS];
798 int linesize[MAX_COMPONENTS];
799 GetBitContext mb_bitmask_gb;
/* bit reader over the MCU bitmap: one bit per MCU */
802 init_get_bits(&mb_bitmask_gb, mb_bitmask, s->mb_width*s->mb_height);
805 if(s->flipped && s->avctx->flags & CODEC_FLAG_EMU_EDGE) {
806 av_log(s->avctx, AV_LOG_ERROR, "Can not flip image with CODEC_FLAG_EMU_EDGE set!\n");
/* per-component plane pointers and strides, indexed by component index c */
809 for(i=0; i < nb_components; i++) {
810 int c = s->comp_index[i];
811 data[c] = s->picture_ptr->data[c];
812 reference_data[c] = reference ? reference->data[c] : NULL;
813 linesize[c]=s->linesize[c];
/* bit 0 of coefs_finished marks the DC coefficient as decoded */
814 s->coefs_finished[c] |= 1;
816 //picture should be flipped upside-down for this codec
817 int offset = (linesize[c] * (s->v_scount[i] * (8 * s->mb_height -((s->height/s->v_max)&7)) - 1 ));
819 reference_data[c] += offset;
824 for(mb_y = 0; mb_y < s->mb_height; mb_y++) {
825 for(mb_x = 0; mb_x < s->mb_width; mb_x++) {
826 const int copy_mb = mb_bitmask && !get_bits1(&mb_bitmask_gb);
828 if (s->restart_interval && !s->restart_count)
829 s->restart_count = s->restart_interval;
831 if(get_bits_count(&s->gb)>s->gb.size_in_bits){
832 av_log(s->avctx, AV_LOG_ERROR, "overread %d\n", get_bits_count(&s->gb) - s->gb.size_in_bits);
835 for(i=0;i<nb_components;i++) {
837 int n, h, v, x, y, c, j;
840 c = s->comp_index[i];
/* byte offset of this 8x8 block inside the plane, scaled down by lowres */
846 block_offset = (((linesize[c] * (v * mb_y + y) * 8) +
847 (h * mb_x + x) * 8) >> s->avctx->lowres);
849 if(s->interlaced && s->bottom_field)
850 block_offset += linesize[c] >> 1;
851 ptr = data[c] + block_offset;
852 if(!s->progressive) {
/* sequential: either copy the block from the reference or decode + IDCT */
854 mjpeg_copy_block(ptr, reference_data[c] + block_offset, linesize[c], s->avctx->lowres);
856 s->dsp.clear_block(s->block);
857 if(decode_block(s, s->block, i,
858 s->dc_index[i], s->ac_index[i],
859 s->quant_matrixes[ s->quant_index[c] ]) < 0) {
860 av_log(s->avctx, AV_LOG_ERROR, "error y=%d x=%d\n", mb_y, mb_x);
863 s->dsp.idct_put(ptr, linesize[c], s->block);
/* progressive: only update the stored coefficients, no IDCT here */
866 int block_idx = s->block_stride[c] * (v * mb_y + y) + (h * mb_x + x);
867 DCTELEM *block = s->blocks[c][block_idx];
/* DC refinement adds one more bit of precision; first DC scan otherwise */
869 block[0] += get_bits1(&s->gb) * s->quant_matrixes[ s->quant_index[c] ][0] << Al;
870 else if(decode_dc_progressive(s, block, i, s->dc_index[i], s->quant_matrixes[ s->quant_index[c] ], Al) < 0) {
871 av_log(s->avctx, AV_LOG_ERROR, "error y=%d x=%d\n", mb_y, mb_x);
875 // av_log(s->avctx, AV_LOG_DEBUG, "mb: %d %d processed\n", mb_y, mb_x);
876 //av_log(NULL, AV_LOG_DEBUG, "%d %d %d %d %d %d %d %d \n", mb_x, mb_y, x, y, c, s->bottom_field, (v * mb_y + y) * 8, (h * mb_x + x) * 8);
/* restart marker: byte-align, skip 0xFF fill bytes and the marker byte,
 * then reset the DC predictors */
884 if (s->restart_interval && show_bits(&s->gb, 8) == 0xFF){ /* skip RSTn */
886 align_get_bits(&s->gb);
887 while(show_bits(&s->gb, 8) == 0xFF)
888 skip_bits(&s->gb, 8);
889 skip_bits(&s->gb, 8);
890 for (i=0; i<nb_components; i++) /* reset dc */
891 s->last_dc[i] = 1024;
/**
 * Decode one progressive AC scan (coefficients ss..se) of the single
 * component s->comp_index[0].
 *
 * Every block of the component is updated through
 * decode_block_refinement() or decode_block_progressive(); blocks are run
 * through idct_put() into the picture (presumably only once last_scan is
 * set -- the guarding condition is not visible).
 *
 * @param ss, se first and last coefficient index of the band
 * @param Ah     presumably selects refinement (non-zero) versus first scan;
 *               the condition is not visible -- TODO confirm
 * @param Al     bit position of this scan
 *
 * NOTE(review): declarations, several conditions and the return statements
 * are not visible in this extract.
 */
898 static int mjpeg_decode_scan_progressive_ac(MJpegDecodeContext *s, int ss, int se, int Ah, int Al){
901 int c = s->comp_index[0];
902 uint8_t* data = s->picture.data[c];
903 int linesize = s->linesize[c];
905 int16_t *quant_matrix = s->quant_matrixes[ s->quant_index[c] ];
/* set bits ss..se in the per-component bitmap of decoded coefficients;
 * last_scan is true once every bit of the bitmap is set */
908 s->coefs_finished[c] |= (1LL<<(se+1))-(1LL<<ss);
909 last_scan = !~s->coefs_finished[c];
912 if(s->interlaced && s->bottom_field)
913 data += linesize >> 1;
915 for(mb_y = 0; mb_y < s->mb_height; mb_y++) {
916 uint8_t *ptr = data + (mb_y*linesize*8 >> s->avctx->lowres);
917 int block_idx = mb_y * s->block_stride[c];
918 DCTELEM (*block)[64] = &s->blocks[c][block_idx];
919 uint8_t *last_nnz = &s->last_nnz[c][block_idx];
920 for(mb_x = 0; mb_x < s->mb_width; mb_x++, block++, last_nnz++) {
923 ret = decode_block_refinement(s, *block, last_nnz, s->ac_index[0],
924 quant_matrix, ss, se, Al, &EOBRUN);
926 ret = decode_block_progressive(s, *block, last_nnz, s->ac_index[0],
927 quant_matrix, ss, se, Al, &EOBRUN);
929 av_log(s->avctx, AV_LOG_ERROR, "error y=%d x=%d\n", mb_y, mb_x);
933 s->dsp.idct_put(ptr, linesize, *block);
934 ptr += 8 >> s->avctx->lowres;
/**
 * Parse a start-of-scan header from s->gb and decode the scan that
 * follows it.
 *
 * The header maps each scan component to a frame component, selects its
 * DC/AC Huffman tables and carries three further fields whose meaning
 * depends on the coding mode (see the inline comments). The scan itself is
 * dispatched to the JPEG-LS, lossless RGB/YUV, progressive AC or generic
 * DCT scan decoder.
 *
 * @param mb_bitmask, reference forwarded unchanged to mjpeg_decode_scan()
 *
 * NOTE(review): h_scount[0] and v_scount[0] are used as divisors for
 * single-component scans; no check that they are non-zero is visible in
 * this function. Several lines (braces, returns, the Metasoft swap, the
 * lossless/rgb conditions, the out_of_range label) are not visible in this
 * extract.
 */
941 int ff_mjpeg_decode_sos(MJpegDecodeContext *s,
942 const uint8_t *mb_bitmask, const AVFrame *reference)
944 int len, nb_components, i, h, v, predictor, point_transform;
/* lossless modes work on single samples, DCT modes on 8x8 blocks */
946 const int block_size= s->lossless ? 1 : 8;
949 /* XXX: verify len field validity */
950 len = get_bits(&s->gb, 16);
951 nb_components = get_bits(&s->gb, 8);
952 if (nb_components == 0 || nb_components > MAX_COMPONENTS){
953 av_log(s->avctx, AV_LOG_ERROR, "decode_sos: nb_components (%d) unsupported\n", nb_components);
/* 6 fixed bytes plus 2 bytes per component */
956 if (len != 6+2*nb_components)
958 av_log(s->avctx, AV_LOG_ERROR, "decode_sos: invalid len (%d)\n", len);
961 for(i=0;i<nb_components;i++) {
/* ids are stored minus 1, matching s->component_id[] */
962 id = get_bits(&s->gb, 8) - 1;
963 av_log(s->avctx, AV_LOG_DEBUG, "component: %d\n", id);
964 /* find component index */
965 for(index=0;index<s->nb_components;index++)
966 if (id == s->component_id[index])
968 if (index == s->nb_components)
970 av_log(s->avctx, AV_LOG_ERROR, "decode_sos: index(%d) out of components\n", index);
973 /* Metasoft MJPEG codec has Cb and Cr swapped */
974 if (s->avctx->codec_tag == MKTAG('M', 'T', 'S', 'J')
975 && nb_components == 3 && s->nb_components == 3 && i)
978 s->comp_index[i] = index;
/* per-scan copies of the component's sampling factors */
980 s->nb_blocks[i] = s->h_count[index] * s->v_count[index];
981 s->h_scount[i] = s->h_count[index];
982 s->v_scount[i] = s->v_count[index];
984 s->dc_index[i] = get_bits(&s->gb, 4);
985 s->ac_index[i] = get_bits(&s->gb, 4);
987 if (s->dc_index[i] < 0 || s->ac_index[i] < 0 ||
988 s->dc_index[i] >= 4 || s->ac_index[i] >= 4)
/* the selected tables must have been built already */
990 if (!s->vlcs[0][s->dc_index[i]].table || !s->vlcs[1][s->ac_index[i]].table)
994 predictor= get_bits(&s->gb, 8); /* JPEG Ss / lossless JPEG predictor /JPEG-LS NEAR */
995 ilv= get_bits(&s->gb, 8); /* JPEG Se / JPEG-LS ILV */
/* streams tagged "CJPG" do not carry the Ah/Al byte; both default to 0 */
996 if(s->avctx->codec_tag != AV_RL32("CJPG")){
997 prev_shift = get_bits(&s->gb, 4); /* Ah */
998 point_transform= get_bits(&s->gb, 4); /* Al */
1000 prev_shift= point_transform= 0;
/* DC predictors restart at 1024 for every scan */
1002 for(i=0;i<nb_components;i++)
1003 s->last_dc[i] = 1024;
1005 if (nb_components > 1) {
1006 /* interleaved stream */
1007 s->mb_width = (s->width + s->h_max * block_size - 1) / (s->h_max * block_size);
1008 s->mb_height = (s->height + s->v_max * block_size - 1) / (s->v_max * block_size);
1009 } else if(!s->ls) { /* skip this for JPEG-LS */
/* non-interleaved: one block per "MCU", sized by this component's
 * subsampling relative to the maximum */
1010 h = s->h_max / s->h_scount[0];
1011 v = s->v_max / s->v_scount[0];
1012 s->mb_width = (s->width + h * block_size - 1) / (h * block_size);
1013 s->mb_height = (s->height + v * block_size - 1) / (v * block_size);
1014 s->nb_blocks[0] = 1;
1019 if(s->avctx->debug & FF_DEBUG_PICT_INFO)
1020 av_log(s->avctx, AV_LOG_DEBUG, "%s %s p:%d >>:%d ilv:%d bits:%d skip:%d %s\n", s->lossless ? "lossless" : "sequential DCT", s->rgb ? "RGB" : "",
1021 predictor, point_transform, ilv, s->bits, s->mjpb_skiptosod,
1022 s->pegasus_rct ? "PRCT" : (s->rct ? "RCT" : ""));
1025 /* mjpeg-b can have padding bytes between sos and image data, skip them */
1026 for (i = s->mjpb_skiptosod; i > 0; i--)
1027 skip_bits(&s->gb, 8);
/* the scan decoders below access s->picture directly in places */
1030 av_assert0(s->picture_ptr == &s->picture);
1031 if(CONFIG_JPEGLS_DECODER && s->ls){
1033 // reset_ls_coding_parameters(s, 0);
1035 if(ff_jpegls_decode_picture(s, predictor, point_transform, ilv) < 0)
1039 if(ljpeg_decode_rgb_scan(s, predictor, point_transform) < 0)
1042 if(ljpeg_decode_yuv_scan(s, predictor, point_transform) < 0)
/* progressive scan with Ss != 0 is an AC scan: predictor holds Ss, ilv Se */
1047 if(s->progressive && predictor) {
1048 av_assert0(s->picture_ptr == &s->picture);
1049 if(mjpeg_decode_scan_progressive_ac(s, predictor, ilv, prev_shift, point_transform) < 0)
1052 if(mjpeg_decode_scan(s, nb_components, prev_shift, point_transform,
1053 mb_bitmask, reference) < 0)
1060 av_log(s->avctx, AV_LOG_ERROR, "decode_sos: ac/dc index out of range\n");
/**
 * Parse a restart-interval segment: a 16-bit length that must equal 4,
 * followed by the 16-bit interval, stored in s->restart_interval.
 * s->restart_count is reset to 0.
 *
 * NOTE(review): the return statements are not visible in this extract.
 */
1064 static int mjpeg_decode_dri(MJpegDecodeContext *s)
1066 if (get_bits(&s->gb, 16) != 4)
1068 s->restart_interval = get_bits(&s->gb, 16);
1069 s->restart_count = 0;
1070 av_log(s->avctx, AV_LOG_DEBUG, "restart interval: %d\n", s->restart_interval);
/**
 * Parse an application (APPn) segment from s->gb.
 *
 * The first four payload bytes are read as a tag and compared against the
 * known producers: "AVI1" (field polarity), "JFIF" (sample aspect ratio,
 * thumbnail), "Adob"+"e" (Adobe header), "LJIF" (Pegasus lossless
 * colourspace) and, for APP1 segments that are long enough, "mjpg" (Apple
 * MJPEG-A header).
 *
 * NOTE(review): the bookkeeping of len, the jumps to the common exit, the
 * switch cases of the LJIF colourspace, parts of a block comment (its
 * delimiters were dropped, leaving one orphaned text line) and the return
 * statement are not visible in this extract.
 */
1075 static int mjpeg_decode_app(MJpegDecodeContext *s)
1079 len = get_bits(&s->gb, 16);
/* refuse segments that claim more data than the buffer holds */
1082 if(8*len + get_bits_count(&s->gb) > s->gb.size_in_bits)
/* read the tag and convert it so it can be compared with AV_RL32("....") */
1085 id = get_bits_long(&s->gb, 32);
1086 id = av_be2ne32(id);
1089 if(s->avctx->debug & FF_DEBUG_STARTCODE){
1090 av_log(s->avctx, AV_LOG_DEBUG, "APPx %8X\n", id);
1093 /* buggy AVID, it puts EOI only at every 10th frame */
1094 /* this fourcc is also used by non-AVID files; it holds some
1095 information, but it is always present in AVID-created files */
1096 if (id == AV_RL32("AVI1"))
1103 4bytes field_size_less_padding
1106 // if (s->first_picture)
1107 // printf("mjpeg: workarounding buggy AVID\n");
/* polarity byte: 2 selects the bottom field, 1 the top field */
1108 i = get_bits(&s->gb, 8);
1109 if (i==2) s->bottom_field= 1;
1110 else if(i==1) s->bottom_field= 0;
1112 skip_bits(&s->gb, 8);
1113 skip_bits(&s->gb, 32);
1114 skip_bits(&s->gb, 32);
1117 // if (s->interlace_polarity)
1118 // printf("mjpeg: interlace polarity: %d\n", s->interlace_polarity);
1124 if (id == AV_RL32("JFIF"))
1126 int t_w, t_h, v1, v2;
1127 skip_bits(&s->gb, 8); /* the trailing zero-byte */
/* v1.v2 is the JFIF version, only used for logging */
1128 v1= get_bits(&s->gb, 8);
1129 v2= get_bits(&s->gb, 8);
1130 skip_bits(&s->gb, 8);
1132 s->avctx->sample_aspect_ratio.num= get_bits(&s->gb, 16);
1133 s->avctx->sample_aspect_ratio.den= get_bits(&s->gb, 16);
1135 if (s->avctx->debug & FF_DEBUG_PICT_INFO)
1136 av_log(s->avctx, AV_LOG_INFO, "mjpeg: JFIF header found (version: %x.%x) SAR=%d/%d\n",
1138 s->avctx->sample_aspect_ratio.num,
1139 s->avctx->sample_aspect_ratio.den
/* thumbnail dimensions */
1142 t_w = get_bits(&s->gb, 8);
1143 t_h = get_bits(&s->gb, 8);
1146 /* skip thumbnail */
1147 if (len-10-(t_w*t_h*3) > 0)
1154 if (id == AV_RL32("Adob") && (get_bits(&s->gb, 8) == 'e'))
1156 if (s->avctx->debug & FF_DEBUG_PICT_INFO)
1157 av_log(s->avctx, AV_LOG_INFO, "mjpeg: Adobe header found\n");
1158 skip_bits(&s->gb, 16); /* version */
1159 skip_bits(&s->gb, 16); /* flags0 */
1160 skip_bits(&s->gb, 16); /* flags1 */
1161 skip_bits(&s->gb, 8); /* transform */
1166 if (id == AV_RL32("LJIF")){
1167 if (s->avctx->debug & FF_DEBUG_PICT_INFO)
1168 av_log(s->avctx, AV_LOG_INFO, "Pegasus lossless jpeg header found\n");
1169 skip_bits(&s->gb, 16); /* version ? */
1170 skip_bits(&s->gb, 16); /* unknown, always 0? */
1171 skip_bits(&s->gb, 16); /* unknown, always 0? */
1172 skip_bits(&s->gb, 16); /* unknown, always 0? */
/* colourspace byte; the case labels are not visible in this extract */
1173 switch( get_bits(&s->gb, 8)){
1183 av_log(s->avctx, AV_LOG_ERROR, "unknown colorspace\n");
1190 if ((s->start_code == APP1) && (len > (0x28 - 8)))
1192 id = get_bits_long(&s->gb, 32);
1193 id = av_be2ne32(id);
1195 if (id == AV_RL32("mjpg")) /* Apple MJPEG-A */
1198 skip_bits(&s->gb, 32); /* field size */
1199 skip_bits(&s->gb, 32); /* pad field size */
1200 skip_bits(&s->gb, 32); /* next off */
1201 skip_bits(&s->gb, 32); /* quant off */
1202 skip_bits(&s->gb, 32); /* huff off */
1203 skip_bits(&s->gb, 32); /* image off */
1204 skip_bits(&s->gb, 32); /* scan off */
1205 skip_bits(&s->gb, 32); /* data off */
1207 if (s->avctx->debug & FF_DEBUG_PICT_INFO)
1208 av_log(s->avctx, AV_LOG_INFO, "mjpeg: Apple MJPEG-A header found\n");
1213 /* slow but needed for extreme adobe jpegs */
1215 av_log(s->avctx, AV_LOG_ERROR, "mjpeg: error, decode_app parser read over the end\n");
/* skip the rest of the segment one byte at a time */
1217 skip_bits(&s->gb, 8);
/**
 * Parse a comment (COM) segment and react to known producer strings.
 *
 * The comment text is copied into a temporary buffer of len - 1 bytes
 * (len - 2 payload bytes plus room for a terminator) and compared against
 * "AVID", "CS=ITU601", "Intel(R) JPEG Library" and "Metasoft MJPEG Codec".
 * Segments that are shorter than 2 bytes or that extend past the end of
 * the bit buffer are ignored.
 *
 * NOTE(review): the NULL check on cbuf, the string termination, the flags
 * set for each producer, the release of cbuf and the return statement are
 * not visible in this extract.
 */
1222 static int mjpeg_decode_com(MJpegDecodeContext *s)
1224 int len = get_bits(&s->gb, 16);
1225 if (len >= 2 && 8*len - 16 + get_bits_count(&s->gb) <= s->gb.size_in_bits) {
1226 char *cbuf = av_malloc(len - 1);
1229 for (i = 0; i < len - 2; i++)
1230 cbuf[i] = get_bits(&s->gb, 8);
/* a trailing newline is special-cased (the action is not visible here) */
1231 if (i > 0 && cbuf[i-1] == '\n')
1236 if(s->avctx->debug & FF_DEBUG_PICT_INFO)
1237 av_log(s->avctx, AV_LOG_INFO, "mjpeg comment: '%s'\n", cbuf);
1239 /* buggy avid, it puts EOI only at every 10th frame */
1240 if (!strcmp(cbuf, "AVID"))
1243 // if (s->first_picture)
1244 // printf("mjpeg: workarounding buggy AVID\n");
1246 else if(!strcmp(cbuf, "CS=ITU601")){
/* prefix matches; len must be large enough for the compared prefix */
1249 else if((len > 20 && !strncmp(cbuf, "Intel(R) JPEG Library", 21)) ||
1250 (len > 19 && !strncmp(cbuf, "Metasoft MJPEG Codec", 20))){
/**
 * Scan [*pbuf_ptr, buf_end) for the next marker: a 0xff byte followed by a
 * byte in the range 0xc0..0xfe, with at least one more byte remaining in
 * the buffer after it.
 *
 * @param pbuf_ptr in: start of the search; out: position where the search
 *                 stopped
 * @param buf_end  end of the input buffer
 *
 * NOTE(review): the loads of v and v2, the skipped-byte counter and the
 * return statements are not visible in this extract.
 */
1261 /* return the 8 bit start code value and update the search
1262 state. Return -1 if no start code found */
1263 static int find_marker(const uint8_t **pbuf_ptr, const uint8_t *buf_end)
1265 const uint8_t *buf_ptr;
1270 buf_ptr = *pbuf_ptr;
1271 while (buf_ptr < buf_end) {
1274 if ((v == 0xff) && (v2 >= 0xc0) && (v2 <= 0xfe) && buf_ptr < buf_end) {
1282 av_dlog(NULL, "find_marker skipped %d bytes\n", skipped);
1283 *pbuf_ptr = buf_ptr;
/**
 * Find the next marker and provide the data that follows it in a form the
 * bit reader can consume.
 *
 * For an SOS marker the entropy-coded data is copied into s->buffer with
 * the JPEG escaping removed (a dedicated bit-level variant handles
 * JPEG-LS); for every other marker the output simply points into the
 * input buffer.
 *
 * @param buf_ptr            in/out: current position in the input buffer
 * @param buf_end            end of the input buffer
 * @param unescaped_buf_ptr  out: start of the data to parse
 * @param unescaped_buf_size out: its size in bytes
 * @return the value produced by find_marker() (return statement not
 *         visible in this extract)
 *
 * NOTE(review): the result of av_malloc() for s->buffer is not checked in
 * the visible lines before dst is written. The release of the old buffer,
 * the unescaping loops' bodies and several conditions are not visible in
 * this extract.
 */
1287 int ff_mjpeg_find_marker(MJpegDecodeContext *s,
1288 const uint8_t **buf_ptr, const uint8_t *buf_end,
1289 const uint8_t **unescaped_buf_ptr, int *unescaped_buf_size)
1292 start_code = find_marker(buf_ptr, buf_end);
/* grow the scratch buffer so it can hold everything up to buf_end */
1294 if ((buf_end - *buf_ptr) > s->buffer_size)
1297 s->buffer_size = buf_end - *buf_ptr;
1298 s->buffer = av_malloc(s->buffer_size + FF_INPUT_BUFFER_PADDING_SIZE);
1299 av_log(s->avctx, AV_LOG_DEBUG, "buffer too small, expanding to %d bytes\n",
1303 /* unescape buffer of SOS, use special treatment for JPEG-LS */
1304 if (start_code == SOS && !s->ls)
1306 const uint8_t *src = *buf_ptr;
1307 uint8_t *dst = s->buffer;
1311 uint8_t x = *(src++);
/* THP streams are excluded from the 0xff handling below */
1314 if (s->avctx->codec_id != CODEC_ID_THP)
/* collapse runs of 0xff */
1317 while (src < buf_end && x == 0xff)
/* restart markers 0xd0..0xd7 are special-cased inside scan data */
1320 if (x >= 0xd0 && x <= 0xd7)
1327 *unescaped_buf_ptr = s->buffer;
1328 *unescaped_buf_size = dst - s->buffer;
1330 av_log(s->avctx, AV_LOG_DEBUG, "escaping removed %td bytes\n",
1331 (buf_end - *buf_ptr) - (dst - s->buffer));
1333 else if(start_code == SOS && s->ls){
1334 const uint8_t *src = *buf_ptr;
1335 uint8_t *dst = s->buffer;
/* first pass: find the length t of the scan data */
1343 while (src + t < buf_end){
1344 uint8_t x = src[t++];
1346 while((src + t < buf_end) && x == 0xff)
/* second pass: rewrite the scan with a bit writer; a byte following 0xff
 * contributes only 7 bits */
1356 init_put_bits(&pb, dst, t);
1358 /* unescape bitstream */
1360 uint8_t x = src[b++];
1361 put_bits(&pb, 8, x);
1364 put_bits(&pb, 7, x);
1368 flush_put_bits(&pb);
1370 *unescaped_buf_ptr = dst;
1371 *unescaped_buf_size = (bit_count + 7) >> 3;
/* any other marker: parse directly from the input buffer */
1375 *unescaped_buf_ptr = *buf_ptr;
1376 *unescaped_buf_size = buf_end - *buf_ptr;
/**
 * Decode one input packet by walking the JPEG markers it contains.
 *
 * For each marker returned by ff_mjpeg_find_marker() the bit reader s->gb is
 * initialised on the payload that function hands back, and the marker code is
 * dispatched to the matching segment decoder.
 *
 * @param avctx     codec context; avctx->priv_data is used as the
 *                  MJpegDecodeContext
 * @param data      output frame, accessed as an AVFrame
 * @param data_size set to sizeof(AVFrame) when a picture is copied to data
 * @param avpkt     input packet; its data and size fields give the buffer
 *                  that is scanned
 * @return buf_ptr - buf at the final return; AVERROR_INVALIDDATA when
 *         ff_mjpeg_decode_sos() fails and avctx->error_recognition is at
 *         least FF_ER_EXPLODE
 */
1382 int ff_mjpeg_decode_frame(AVCodecContext *avctx,
1383 void *data, int *data_size,
1386 const uint8_t *buf = avpkt->data;
1387 int buf_size = avpkt->size;
1388 MJpegDecodeContext *s = avctx->priv_data;
1389 const uint8_t *buf_end, *buf_ptr;
/* payload pointer and size filled in by ff_mjpeg_find_marker() */
1390 const uint8_t *unescaped_buf_ptr;
1391 int unescaped_buf_size;
1393 AVFrame *picture = data;
1395 s->got_picture = 0; // picture from previous image can not be reused
1397 buf_end = buf + buf_size;
1398 while (buf_ptr < buf_end) {
1399 /* find the next marker and its payload */
1400 start_code = ff_mjpeg_find_marker(s, &buf_ptr, buf_end,
1401 &unescaped_buf_ptr, &unescaped_buf_size);
/* a negative start_code is the "no marker" result of the search */
1404 if (start_code < 0) {
1407 av_log(avctx, AV_LOG_DEBUG, "marker=%x avail_size_in_buf=%td\n", start_code, buf_end - buf_ptr);
/* the bit reader works on the payload returned above; size is given in bits */
1409 init_get_bits(&s->gb, unescaped_buf_ptr, unescaped_buf_size*8);
1411 s->start_code = start_code;
1412 if(s->avctx->debug & FF_DEBUG_STARTCODE){
1413 av_log(avctx, AV_LOG_DEBUG, "startcode: %X\n", start_code);
1416 /* process markers */
/* 0xd0..0xd7: restart markers, only logged here (low nibble is the index) */
1417 if (start_code >= 0xd0 && start_code <= 0xd7) {
1418 av_log(avctx, AV_LOG_DEBUG, "restart marker: %d\n", start_code&0x0f);
1420 } else if (start_code >= APP0 && start_code <= APP15) {
1421 mjpeg_decode_app(s);
1423 } else if (start_code == COM){
1424 mjpeg_decode_com(s);
1427 switch(start_code) {
/* restart bookkeeping is cleared before the rest of the image is parsed */
1429 s->restart_interval = 0;
1431 s->restart_count = 0;
1432 /* nothing to do on SOI */
1435 ff_mjpeg_decode_dqt(s);
1438 if(ff_mjpeg_decode_dht(s) < 0){
1439 av_log(avctx, AV_LOG_ERROR, "huffman table decode error\n");
/* NOTE(review): four separate ff_mjpeg_decode_sof() call sites follow;
 * presumably one per frame-header variant - confirm against the case labels */
1448 if (ff_mjpeg_decode_sof(s) < 0)
1455 if (ff_mjpeg_decode_sof(s) < 0)
1462 if (ff_mjpeg_decode_sof(s) < 0)
1469 if (ff_mjpeg_decode_sof(s) < 0)
/* when CONFIG_JPEGLS_DECODER is 0 the condition is true without calling
 * ff_jpegls_decode_lse() */
1473 if (!CONFIG_JPEGLS_DECODER || ff_jpegls_decode_lse(s) < 0)
1478 if ((s->buggy_avid && !s->interlaced) || s->restart_interval)
1481 if (!s->got_picture) {
1482 av_log(avctx, AV_LOG_WARNING, "Found EOI before any SOF, ignoring\n");
1485 if (s->interlaced) {
/* toggle which field is expected next */
1486 s->bottom_field ^= 1;
1487 /* if not bottom field, do not output image yet */
1488 if (s->bottom_field == !s->interlace_polarity)
/* copy the decoder's current picture into the output frame and set the
 * output size to sizeof(AVFrame) */
1491 *picture = *s->picture_ptr;
1492 *data_size = sizeof(AVFrame);
/* quality is the largest of the three qscale entries; the first
 * (s->width+15)/16 bytes of the qscale table are filled with it */
1495 picture->quality= FFMAX3(s->qscale[0], s->qscale[1], s->qscale[2]);
1496 picture->qstride= 0;
1497 picture->qscale_table= s->qscale_table;
1498 memset(picture->qscale_table, picture->quality, (s->width+15)/16);
1499 if(avctx->debug & FF_DEBUG_QP)
1500 av_log(avctx, AV_LOG_DEBUG, "QP: %d\n", picture->quality);
/* scaled by FF_QP2LAMBDA only after the table fill and the debug log above */
1501 picture->quality*= FF_QP2LAMBDA;
1506 if (!s->got_picture) {
1507 av_log(avctx, AV_LOG_WARNING, "Can not process SOS before SOF, skipping\n");
/* an SOS decode failure is returned to the caller only when
 * error_recognition is at least FF_ER_EXPLODE */
1510 if (ff_mjpeg_decode_sos(s, NULL, NULL) < 0 &&
1511 avctx->error_recognition >= FF_ER_EXPLODE)
1512 return AVERROR_INVALIDDATA;
1513 /* buggy avid puts EOI every 10-20th frame */
1514 /* if restart period is over process EOI */
1515 if ((s->buggy_avid && !s->interlaced) || s->restart_interval)
1519 mjpeg_decode_dri(s);
1531 av_log(avctx, AV_LOG_ERROR, "mjpeg: unsupported coding type (%x)\n", start_code);
1534 // printf("mjpeg: unsupported marker (%x)\n", start_code);
1539 /* end of start code processing: skip the bytes the bit reader consumed,
 * rounding the bit count up to whole bytes */
1540 buf_ptr += (get_bits_count(&s->gb)+7)/8;
1541 av_log(avctx, AV_LOG_DEBUG, "marker parser used %d bytes (%d bits)\n",
1542 (get_bits_count(&s->gb)+7)/8, get_bits_count(&s->gb));
/* a picture was started but no EOI was handled: warn that EOI is emulated */
1546 if (s->got_picture) {
1547 av_log(avctx, AV_LOG_WARNING, "EOI missing, emulating\n");
1550 av_log(avctx, AV_LOG_FATAL, "No JPEG data found in image\n");
1553 av_log(avctx, AV_LOG_DEBUG, "mjpeg decode frame unused %td bytes\n", buf_end - buf_ptr);
1554 // return buf_end - buf_ptr;
/* the return value is the offset of buf_ptr from the start of the packet */
1555 return buf_ptr - buf;
/**
 * Release what the decoder's private context owns.
 *
 * Visible here: the current picture buffer is released through
 * avctx->release_buffer() if it has data, then qscale_table, ljpeg_buffer,
 * the VLC tables in s->vlcs and the per-component blocks / last_nnz arrays
 * are freed.
 *
 * @param avctx codec context; avctx->priv_data is used as the
 *              MJpegDecodeContext
 */
1558 av_cold int ff_mjpeg_decode_end(AVCodecContext *avctx)
1560 MJpegDecodeContext *s = avctx->priv_data;
/* only release a picture that actually has a data plane attached */
1563 if (s->picture_ptr && s->picture_ptr->data[0])
1564 avctx->release_buffer(avctx, s->picture_ptr);
/* NOTE(review): av_free() leaves s->qscale_table holding the freed address,
 * unlike the av_freep() calls below - confirm nothing reads it afterwards */
1567 av_free(s->qscale_table);
1568 av_freep(&s->ljpeg_buffer);
1569 s->ljpeg_buffer_size=0;
1573 free_vlc(&s->vlcs[i][j]);
/* per-component arrays, one entry for each of MAX_COMPONENTS */
1575 for(i=0; i<MAX_COMPONENTS; i++) {
1576 av_freep(&s->blocks[i]);
1577 av_freep(&s->last_nnz[i]);
/*
 * Codec descriptor for the MJPEG decoder (id CODEC_ID_MJPEG, video type).
 * The private context is a MJpegDecodeContext, and the init / close / decode
 * callbacks are ff_mjpeg_decode_init, ff_mjpeg_decode_end and
 * ff_mjpeg_decode_frame. The only capability flag set is CODEC_CAP_DR1.
 */
1582 AVCodec ff_mjpeg_decoder = {
1584 .type = AVMEDIA_TYPE_VIDEO,
1585 .id = CODEC_ID_MJPEG,
1586 .priv_data_size = sizeof(MJpegDecodeContext),
1587 .init = ff_mjpeg_decode_init,
1588 .close = ff_mjpeg_decode_end,
1589 .decode = ff_mjpeg_decode_frame,
1590 .capabilities = CODEC_CAP_DR1,
1592 .long_name = NULL_IF_CONFIG_SMALL("MJPEG (Motion JPEG)"),
/*
 * Codec descriptor for "Nintendo Gamecube THP video". It uses the same
 * private context type (MJpegDecodeContext) and the same init / close /
 * decode callbacks as ff_mjpeg_decoder, and also sets CODEC_CAP_DR1.
 */
1595 AVCodec ff_thp_decoder = {
1597 .type = AVMEDIA_TYPE_VIDEO,
1599 .priv_data_size = sizeof(MJpegDecodeContext),
1600 .init = ff_mjpeg_decode_init,
1601 .close = ff_mjpeg_decode_end,
1602 .decode = ff_mjpeg_decode_frame,
1603 .capabilities = CODEC_CAP_DR1,
1605 .long_name = NULL_IF_CONFIG_SMALL("Nintendo Gamecube THP video"),