2 * MJPEG encoder and decoder
3 * Copyright (c) 2000, 2001 Fabrice Bellard.
4 * Copyright (c) 2003 Alex Beregszaszi
5 * Copyright (c) 2003-2004 Michael Niedermayer
7 * This library is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2 of the License, or (at your option) any later version.
12 * This library is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Lesser General Public License for more details.
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with this library; if not, write to the Free Software
19 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
21 * Support for external huffman table, various fixes (AVID workaround),
22 * aspecting, new decode_frame mechanism and apple mjpeg-b support
23 * by Alex Beregszaszi <alex@naxine.org>
28 * MJPEG encoder and decoder.
36 #include "mpegvideo.h"
38 /* use two quantizer tables (one for luminance and one for chrominance) */
/* Encoder-side Huffman tables. For each of the four tables (DC/AC crossed
 * with luminance/chrominance) there is a size array and a code array, both
 * indexed by symbol. The encoder hands huff_size[sym] and huff_code[sym]
 * to put_bits() as a pair. mjpeg_init() fills them through
 * build_huffman_codes(). */
42 typedef struct MJpegContext {
43 uint8_t huff_size_dc_luminance[12]; //FIXME use array [3] instead of lumi / chrom, for easier addressing
44 uint16_t huff_code_dc_luminance[12];
45 uint8_t huff_size_dc_chrominance[12];
46 uint16_t huff_code_dc_chrominance[12];
48 uint8_t huff_size_ac_luminance[256];
49 uint16_t huff_code_ac_luminance[256];
50 uint8_t huff_size_ac_chrominance[256];
51 uint16_t huff_code_ac_chrominance[256];
54 /* JPEG marker codes */
/* Each value is the byte that follows the 0xff prefix of a marker:
 * put_marker() writes 0xff and then one of these codes. */
57 SOF0 = 0xc0, /* baseline */
58 SOF1 = 0xc1, /* extended sequential, huffman */
59 SOF2 = 0xc2, /* progressive, huffman */
60 SOF3 = 0xc3, /* lossless, huffman */
62 SOF5 = 0xc5, /* differential sequential, huffman */
63 SOF6 = 0xc6, /* differential progressive, huffman */
64 SOF7 = 0xc7, /* differential lossless, huffman */
65 JPG = 0xc8, /* reserved for JPEG extension */
66 SOF9 = 0xc9, /* extended sequential, arithmetic */
67 SOF10 = 0xca, /* progressive, arithmetic */
68 SOF11 = 0xcb, /* lossless, arithmetic */
70 SOF13 = 0xcd, /* differential sequential, arithmetic */
71 SOF14 = 0xce, /* differential progressive, arithmetic */
72 SOF15 = 0xcf, /* differential lossless, arithmetic */
74 DHT = 0xc4, /* define huffman tables */
76 DAC = 0xcc, /* define arithmetic-coding conditioning */
78 /* restart with modulo 8 count "m" */
88 SOI = 0xd8, /* start of image */
89 EOI = 0xd9, /* end of image */
90 SOS = 0xda, /* start of scan */
91 DQT = 0xdb, /* define quantization tables */
92 DNL = 0xdc, /* define number of lines */
93 DRI = 0xdd, /* define restart interval */
94 DHP = 0xde, /* define hierarchical progression */
95 EXP = 0xdf, /* expand reference components */
121 SOF48 = 0xf7, ///< JPEG-LS
122 LSE = 0xf8, ///< JPEG-LS extension parameters
129 COM = 0xfe, /* comment */
131 TEM = 0x01, /* temporary private use for arithmetic coding */
133 /* 0x02 -> 0xbf reserved */
137 /* These are the sample quantization tables given in JPEG spec section K.1.
138 * The spec says that the values given produce "good" quality, and
139 * when divided by 2, "very good" quality.
// Luminance sample quantization table: 64 entries, written as 8 rows of 8.
141 static const unsigned char std_luminance_quant_tbl[64] = {
142 16, 11, 10, 16, 24, 40, 51, 61,
143 12, 12, 14, 19, 26, 58, 60, 55,
144 14, 13, 16, 24, 40, 57, 69, 56,
145 14, 17, 22, 29, 51, 87, 80, 62,
146 18, 22, 37, 56, 68, 109, 103, 77,
147 24, 35, 55, 64, 81, 104, 113, 92,
148 49, 64, 78, 87, 103, 121, 120, 101,
149 72, 92, 95, 98, 112, 100, 103, 99
// Chrominance sample quantization table: 64 entries, written as 8 rows of 8.
151 static const unsigned char std_chrominance_quant_tbl[64] = {
152 17, 18, 24, 47, 99, 99, 99, 99,
153 18, 21, 26, 66, 99, 99, 99, 99,
154 24, 26, 56, 99, 99, 99, 99, 99,
155 47, 66, 99, 99, 99, 99, 99, 99,
156 99, 99, 99, 99, 99, 99, 99, 99,
157 99, 99, 99, 99, 99, 99, 99, 99,
158 99, 99, 99, 99, 99, 99, 99, 99,
159 99, 99, 99, 99, 99, 99, 99, 99
163 /* Set up the standard Huffman tables (cf. JPEG standard section K.3) */
164 /* IMPORTANT: these are only valid for 8-bit data precision! */
/* DC luminance "bits" table, 17 entries; entry 0 is the 0-base placeholder.
 * NOTE(review): presumably entry i (1..16) is the number of Huffman codes
 * of length i bits, as in a JPEG DHT segment -- confirm. */
165 static const uint8_t bits_dc_luminance[17] =
166 { /* 0-base */ 0, 0, 1, 5, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0 };
/* DC luminance symbol values, in the order build_huffman_codes() reads
 * them from its val_table argument. */
167 static const uint8_t val_dc_luminance[] =
168 { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11 };
/* DC chrominance "bits" table, 17 entries; entry 0 is the 0-base
 * placeholder.
 * NOTE(review): presumably entry i (1..16) is the number of Huffman codes
 * of length i bits -- confirm. */
170 static const uint8_t bits_dc_chrominance[17] =
171 { /* 0-base */ 0, 0, 3, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0 };
/* DC chrominance symbol values, in the order build_huffman_codes() reads
 * them from its val_table argument. */
172 static const uint8_t val_dc_chrominance[] =
173 { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11 };
/* AC luminance "bits" table, 17 entries; entry 0 is the 0-base placeholder.
 * NOTE(review): presumably entry i (1..16) is the number of Huffman codes
 * of length i bits -- confirm. */
175 static const uint8_t bits_ac_luminance[17] =
176 { /* 0-base */ 0, 0, 2, 1, 3, 3, 2, 4, 3, 5, 5, 4, 4, 0, 0, 1, 0x7d };
/* AC luminance symbol values, in the order build_huffman_codes() reads
 * them. The encoder builds AC symbols as (run << 4) | nbits, see
 * encode_block(). */
177 static const uint8_t val_ac_luminance[] =
178 { 0x01, 0x02, 0x03, 0x00, 0x04, 0x11, 0x05, 0x12,
179 0x21, 0x31, 0x41, 0x06, 0x13, 0x51, 0x61, 0x07,
180 0x22, 0x71, 0x14, 0x32, 0x81, 0x91, 0xa1, 0x08,
181 0x23, 0x42, 0xb1, 0xc1, 0x15, 0x52, 0xd1, 0xf0,
182 0x24, 0x33, 0x62, 0x72, 0x82, 0x09, 0x0a, 0x16,
183 0x17, 0x18, 0x19, 0x1a, 0x25, 0x26, 0x27, 0x28,
184 0x29, 0x2a, 0x34, 0x35, 0x36, 0x37, 0x38, 0x39,
185 0x3a, 0x43, 0x44, 0x45, 0x46, 0x47, 0x48, 0x49,
186 0x4a, 0x53, 0x54, 0x55, 0x56, 0x57, 0x58, 0x59,
187 0x5a, 0x63, 0x64, 0x65, 0x66, 0x67, 0x68, 0x69,
188 0x6a, 0x73, 0x74, 0x75, 0x76, 0x77, 0x78, 0x79,
189 0x7a, 0x83, 0x84, 0x85, 0x86, 0x87, 0x88, 0x89,
190 0x8a, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97, 0x98,
191 0x99, 0x9a, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7,
192 0xa8, 0xa9, 0xaa, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6,
193 0xb7, 0xb8, 0xb9, 0xba, 0xc2, 0xc3, 0xc4, 0xc5,
194 0xc6, 0xc7, 0xc8, 0xc9, 0xca, 0xd2, 0xd3, 0xd4,
195 0xd5, 0xd6, 0xd7, 0xd8, 0xd9, 0xda, 0xe1, 0xe2,
196 0xe3, 0xe4, 0xe5, 0xe6, 0xe7, 0xe8, 0xe9, 0xea,
197 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7, 0xf8,
/* AC chrominance "bits" table, 17 entries; entry 0 is the 0-base
 * placeholder.
 * NOTE(review): presumably entry i (1..16) is the number of Huffman codes
 * of length i bits -- confirm. */
201 static const uint8_t bits_ac_chrominance[17] =
202 { /* 0-base */ 0, 0, 2, 1, 2, 4, 4, 3, 4, 7, 5, 4, 4, 0, 1, 2, 0x77 };
/* AC chrominance symbol values, in the order build_huffman_codes() reads
 * them. The encoder builds AC symbols as (run << 4) | nbits, see
 * encode_block(). */
204 static const uint8_t val_ac_chrominance[] =
205 { 0x00, 0x01, 0x02, 0x03, 0x11, 0x04, 0x05, 0x21,
206 0x31, 0x06, 0x12, 0x41, 0x51, 0x07, 0x61, 0x71,
207 0x13, 0x22, 0x32, 0x81, 0x08, 0x14, 0x42, 0x91,
208 0xa1, 0xb1, 0xc1, 0x09, 0x23, 0x33, 0x52, 0xf0,
209 0x15, 0x62, 0x72, 0xd1, 0x0a, 0x16, 0x24, 0x34,
210 0xe1, 0x25, 0xf1, 0x17, 0x18, 0x19, 0x1a, 0x26,
211 0x27, 0x28, 0x29, 0x2a, 0x35, 0x36, 0x37, 0x38,
212 0x39, 0x3a, 0x43, 0x44, 0x45, 0x46, 0x47, 0x48,
213 0x49, 0x4a, 0x53, 0x54, 0x55, 0x56, 0x57, 0x58,
214 0x59, 0x5a, 0x63, 0x64, 0x65, 0x66, 0x67, 0x68,
215 0x69, 0x6a, 0x73, 0x74, 0x75, 0x76, 0x77, 0x78,
216 0x79, 0x7a, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87,
217 0x88, 0x89, 0x8a, 0x92, 0x93, 0x94, 0x95, 0x96,
218 0x97, 0x98, 0x99, 0x9a, 0xa2, 0xa3, 0xa4, 0xa5,
219 0xa6, 0xa7, 0xa8, 0xa9, 0xaa, 0xb2, 0xb3, 0xb4,
220 0xb5, 0xb6, 0xb7, 0xb8, 0xb9, 0xba, 0xc2, 0xc3,
221 0xc4, 0xc5, 0xc6, 0xc7, 0xc8, 0xc9, 0xca, 0xd2,
222 0xd3, 0xd4, 0xd5, 0xd6, 0xd7, 0xd8, 0xd9, 0xda,
223 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7, 0xe8, 0xe9,
224 0xea, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7, 0xf8,
228 /* isn't this function nicer than the one in the libjpeg ? */
/* Fills the per-symbol tables huff_size[] and huff_code[] from a
 * bits_table / val_table pair.
 * Symbols are consumed from val_table in order (val_table[k++]) and the
 * current code word is stored at huff_code[sym].
 * NOTE(review): build_vlc() zeroes huff_size[] before calling this, so
 * symbols that do not occur in val_table presumably keep whatever the
 * caller put there -- confirm. */
229 static void build_huffman_codes(uint8_t *huff_size, uint16_t *huff_code,
230 const uint8_t *bits_table, const uint8_t *val_table)
232 int i, j, k,nb, code, sym;
239 sym = val_table[k++];
241 huff_code[sym] = code;
248 #ifdef CONFIG_ENCODERS
/* Encoder initialisation: allocates an MJpegContext with av_malloc() and
 * builds the four encoder Huffman tables (DC/AC, luminance/chrominance)
 * into it with build_huffman_codes().
 * NOTE(review): mjpeg_close() frees s->mjpeg_ctx, so the context is
 * presumably stored there -- confirm. */
249 int mjpeg_init(MpegEncContext *s)
253 m = av_malloc(sizeof(MJpegContext));
260 /* build all the huffman tables */
261 build_huffman_codes(m->huff_size_dc_luminance,
262 m->huff_code_dc_luminance,
265 build_huffman_codes(m->huff_size_dc_chrominance,
266 m->huff_code_dc_chrominance,
269 build_huffman_codes(m->huff_size_ac_luminance,
270 m->huff_code_ac_luminance,
273 build_huffman_codes(m->huff_size_ac_chrominance,
274 m->huff_code_ac_chrominance,
/* Encoder teardown: releases the context in s->mjpeg_ctx with av_free(). */
282 void mjpeg_close(MpegEncContext *s)
284 av_free(s->mjpeg_ctx);
286 #endif //CONFIG_ENCODERS
/* Lossless prediction: stores in `ret` a prediction computed from the
 * left, top and top-left neighbour values, selected by `predictor`:
 *   1 left, 2 top, 3 topleft, 4 left + top - topleft,
 *   5 left + ((top - topleft) >> 1), 6 top + ((left - topleft) >> 1),
 *   7 (left + top) >> 1.
 * The arguments are expanded textually and may be evaluated in whichever
 * case is taken. */
288 #define PREDICT(ret, topleft, top, left, predictor)\
290 case 1: ret= left; break;\
291 case 2: ret= top; break;\
292 case 3: ret= topleft; break;\
293 case 4: ret= left + top - topleft; break;\
294 case 5: ret= left + ((top - topleft)>>1); break;\
295 case 6: ret= top + ((left - topleft)>>1); break;\
297 case 7: ret= (left + top)>>1; break;\
300 #ifdef CONFIG_ENCODERS
/* Writes a two-byte marker to p: the 0xff prefix followed by `code`
 * (one of the marker codes such as SOI, SOS or EOI). */
301 static inline void put_marker(PutBitContext *p, int code)
303 put_bits(p, 8, 0xff);
304 put_bits(p, 8, code);
307 /* table_class: 0 = DC coef, 1 = AC coefs */
/* Writes one Huffman table to s->pb: a 4-bit table_class and a 4-bit
 * table_id, then bytes taken from bits_table, then bytes taken from
 * value_table.
 * NOTE(review): jpeg_table_header() adds the return value to a running
 * `size`, so this presumably returns the number of bytes written --
 * confirm. */
308 static int put_huffman_table(MpegEncContext *s, int table_class, int table_id,
309 const uint8_t *bits_table, const uint8_t *value_table)
311 PutBitContext *p = &s->pb;
314 put_bits(p, 4, table_class);
315 put_bits(p, 4, table_id);
320 put_bits(p, 8, bits_table[i]);
324 put_bits(p, 8, value_table[i]);
/* Writes the quantization and Huffman table segments to s->pb.
 * Quantization entries come from s->intra_matrix (table 0) and
 * s->chroma_intra_matrix (table 1), each indexed through
 * s->intra_scantable.permutated. The Huffman segment length is first
 * written as 0 and patched later; `size` accumulates the results of the
 * four put_huffman_table() calls. */
329 static void jpeg_table_header(MpegEncContext *s)
331 PutBitContext *p = &s->pb;
338 put_bits(p, 16, 2 + 2 * (1 + 64)); // segment length when two (1+64)-byte tables follow
340 put_bits(p, 16, 2 + 1 * (1 + 64)); // segment length when one (1+64)-byte table follows
342 put_bits(p, 4, 0); /* 8 bit precision */
343 put_bits(p, 4, 0); /* table 0 */
345 j = s->intra_scantable.permutated[i];
346 put_bits(p, 8, s->intra_matrix[j]);
349 put_bits(p, 4, 0); /* 8 bit precision */
350 put_bits(p, 4, 1); /* table 1 */
352 j = s->intra_scantable.permutated[i];
353 put_bits(p, 8, s->chroma_intra_matrix[j]);
361 put_bits(p, 16, 0); /* patched later */
363 size += put_huffman_table(s, 0, 0, bits_dc_luminance, val_dc_luminance);
364 size += put_huffman_table(s, 0, 1, bits_dc_chrominance, val_dc_chrominance);
366 size += put_huffman_table(s, 1, 0, bits_ac_luminance, val_ac_luminance);
367 size += put_huffman_table(s, 1, 1, bits_ac_chrominance, val_ac_chrominance);
/* Writes the optional informational segments of the picture header:
 *  - when s->aspect_ratio_info is set, a "JFIF" segment (version 1.02,
 *    units 0) carrying the sample aspect ratio and no thumbnail;
 *  - unless CODEC_FLAG_BITEXACT is set, a segment holding
 *    LIBAVCODEC_IDENT;
 *  - for YUV420P / YUV422P / YUV444P input, a segment holding "CS=ITU601".
 * The last two write a 16-bit length of 0 first and patch it later;
 * `size` is the string length plus 3 (2 length bytes and the trailing
 * zero byte written by ff_put_string). */
372 static void jpeg_put_comments(MpegEncContext *s)
374 PutBitContext *p = &s->pb;
378 if (s->aspect_ratio_info /* && !lossless */)
383 ff_put_string(p, "JFIF", 1); /* this puts the trailing zero-byte too */
384 put_bits(p, 16, 0x0201); /* v 1.02 */
385 put_bits(p, 8, 0); /* units type: 0 - aspect ratio */
386 put_bits(p, 16, s->avctx->sample_aspect_ratio.num);
387 put_bits(p, 16, s->avctx->sample_aspect_ratio.den);
388 put_bits(p, 8, 0); /* thumbnail width */
389 put_bits(p, 8, 0); /* thumbnail height */
393 if(!(s->flags & CODEC_FLAG_BITEXACT)){
397 put_bits(p, 16, 0); /* patched later */
398 ff_put_string(p, LIBAVCODEC_IDENT, 1);
399 size = strlen(LIBAVCODEC_IDENT)+3;
404 if( s->avctx->pix_fmt == PIX_FMT_YUV420P
405 ||s->avctx->pix_fmt == PIX_FMT_YUV422P
406 ||s->avctx->pix_fmt == PIX_FMT_YUV444P){
410 put_bits(p, 16, 0); /* patched later */
411 ff_put_string(p, "CS=ITU601", 1);
412 size = strlen("CS=ITU601")+3;
/* Writes everything that precedes the entropy-coded data of one picture:
 * SOI, the optional comment segments, the table segments when
 * s->mjpeg_write_tables is set, a start-of-frame segment whose marker
 * depends on the codec id (SOF0 / SOF3 / SOF48), and a start-of-scan
 * segment. Both segments always describe 3 components.
 * `lossless` is true for every codec id other than CODEC_ID_MJPEG; `ls`
 * is true only for CODEC_ID_JPEGLS, which must not be combined with
 * mjpeg_write_tables (asserted). */
418 void mjpeg_picture_header(MpegEncContext *s)
420 const int lossless= s->avctx->codec_id != CODEC_ID_MJPEG;
421 const int ls = s->avctx->codec_id == CODEC_ID_JPEGLS;
423 assert(!(ls && s->mjpeg_write_tables));
425 put_marker(&s->pb, SOI);
427 if (!s->mjpeg_data_only_frames)
429 jpeg_put_comments(s);
431 if (s->mjpeg_write_tables) jpeg_table_header(s);
433 switch(s->avctx->codec_id){
434 case CODEC_ID_MJPEG: put_marker(&s->pb, SOF0 ); break;
435 case CODEC_ID_LJPEG: put_marker(&s->pb, SOF3 ); break;
436 case CODEC_ID_JPEGLS: put_marker(&s->pb, SOF48); break;
440 put_bits(&s->pb, 16, 17); // frame header length: 8 + 3 bytes for each of the 3 components
441 if(lossless && s->avctx->pix_fmt == PIX_FMT_RGBA32)
442 put_bits(&s->pb, 8, 9); /* 9 bits/component RCT */
444 put_bits(&s->pb, 8, 8); /* 8 bits/component */
445 put_bits(&s->pb, 16, s->height);
446 put_bits(&s->pb, 16, s->width);
447 put_bits(&s->pb, 8, 3); /* 3 components */
450 put_bits(&s->pb, 8, 1); /* component number */
451 put_bits(&s->pb, 4, s->mjpeg_hsample[0]); /* H factor */
452 put_bits(&s->pb, 4, s->mjpeg_vsample[0]); /* V factor */
453 put_bits(&s->pb, 8, 0); /* select matrix */
456 put_bits(&s->pb, 8, 2); /* component number */
457 put_bits(&s->pb, 4, s->mjpeg_hsample[1]); /* H factor */
458 put_bits(&s->pb, 4, s->mjpeg_vsample[1]); /* V factor */
460 put_bits(&s->pb, 8, lossless ? 0 : 1); /* select matrix */
462 put_bits(&s->pb, 8, 0); /* select matrix */
466 put_bits(&s->pb, 8, 3); /* component number */
467 put_bits(&s->pb, 4, s->mjpeg_hsample[2]); /* H factor */
468 put_bits(&s->pb, 4, s->mjpeg_vsample[2]); /* V factor */
470 put_bits(&s->pb, 8, lossless ? 0 : 1); /* select matrix */
472 put_bits(&s->pb, 8, 0); /* select matrix */
477 put_marker(&s->pb, SOS);
478 put_bits(&s->pb, 16, 12); /* length */
479 put_bits(&s->pb, 8, 3); /* 3 components */
482 put_bits(&s->pb, 8, 1); /* index */
483 put_bits(&s->pb, 4, 0); /* DC huffman table index */
484 put_bits(&s->pb, 4, 0); /* AC huffman table index */
487 put_bits(&s->pb, 8, 2); /* index */
488 put_bits(&s->pb, 4, 1); /* DC huffman table index */
489 put_bits(&s->pb, 4, lossless ? 0 : 1); /* AC huffman table index */
492 put_bits(&s->pb, 8, 3); /* index */
493 put_bits(&s->pb, 4, 1); /* DC huffman table index */
494 put_bits(&s->pb, 4, lossless ? 0 : 1); /* AC huffman table index */
496 put_bits(&s->pb, 8, (lossless && !ls) ? s->avctx->prediction_method+1 : 0); /* Ss (not used) */
498 switch(s->avctx->codec_id){
499 case CODEC_ID_MJPEG: put_bits(&s->pb, 8, 63); break; /* Se (not used) */
500 case CODEC_ID_LJPEG: put_bits(&s->pb, 8, 0); break; /* not used */
501 case CODEC_ID_JPEGLS: put_bits(&s->pb, 8, 1); break; /* ILV = line interleaved */
505 put_bits(&s->pb, 8, 0); /* Ah/Al (not used) */
507 //FIXME DC/AC entropy table selectors stuff in jpegls
/* Post-processes the bytes written to s->pb from byte offset `start` to
 * the current position (which must be byte aligned, see the assert).
 * It counts the 0xFF bytes in that range, returns early when there are
 * none, otherwise appends ff_count zero bytes to the stream, flushes, and
 * then walks the range backwards from its last byte until ff_count is
 * used up.
 * NOTE(review): the body of the backward loop is not visible here; it
 * presumably moves bytes towards the end so that a 0x00 follows every
 * 0xFF -- confirm.
 * NOTE(review): the middle loop reads the buffer through uint32_t
 * pointers; `align` skips leading bytes so those loads start on a 4-byte
 * boundary. */
510 static void escape_FF(MpegEncContext *s, int start)
512 int size= put_bits_count(&s->pb) - start*8;
514 uint8_t *buf= s->pb.buf + start;
515 int align= (-(size_t)(buf))&3;
517 assert((size&7) == 0);
521 for(i=0; i<size && i<align; i++){
522 if(buf[i]==0xFF) ff_count++;
524 for(; i<size-15; i+=16){
527 v= *(uint32_t*)(&buf[i]);
528 acc= (((v & (v>>4))&0x0F0F0F0F)+0x01010101)&0x10101010; // each byte equal to 0xFF contributes 0x10 in its own byte lane
529 v= *(uint32_t*)(&buf[i+4]);
530 acc+=(((v & (v>>4))&0x0F0F0F0F)+0x01010101)&0x10101010;
531 v= *(uint32_t*)(&buf[i+8]);
532 acc+=(((v & (v>>4))&0x0F0F0F0F)+0x01010101)&0x10101010;
533 v= *(uint32_t*)(&buf[i+12]);
534 acc+=(((v & (v>>4))&0x0F0F0F0F)+0x01010101)&0x10101010;
542 if(buf[i]==0xFF) ff_count++;
545 if(ff_count==0) return;
548 for(i=0; i<ff_count-3; i+=4)
549 put_bits(&s->pb, 32, 0);
550 put_bits(&s->pb, (ff_count-i)*8, 0);
551 flush_put_bits(&s->pb);
553 for(i=size-1; ff_count; i--){
557 //printf("%d %d\n", i, ff_count);
/* Pads the bitstream in pbc up to the next byte boundary with 1-bits.
 * `length` is the number of bits missing to the boundary (0..7); nothing
 * is written when the stream is already aligned. */
566 void ff_mjpeg_stuffing(PutBitContext * pbc)
569 length= (-put_bits_count(pbc))&7;
570 if(length) put_bits(pbc, length, (1<<length)-1);
/* Finishes one picture: pads to a byte boundary, flushes the bit writer,
 * runs escape_FF() over everything written after the header
 * (s->header_bits must be a whole number of bytes), and writes EOI. */
573 void mjpeg_picture_trailer(MpegEncContext *s)
575 ff_mjpeg_stuffing(&s->pb);
576 flush_put_bits(&s->pb);
578 assert((s->header_bits&7)==0);
580 escape_FF(s, s->header_bits>>3);
582 put_marker(&s->pb, EOI);
/* Writes one DC (or lossless difference) value to s->pb with the given
 * Huffman tables: the code for the size category `nbits`, followed by the
 * low `nbits` bits of `mant`. The category is av_log2_16bit(val) + 1;
 * category 0 is written as the bare code huff_code[0].
 * NOTE(review): the branch conditions and the derivation of `mant` from
 * `val` are not visible here; presumably category 0 is used when val is 0
 * and `val` is made non-negative before the log2 -- confirm. */
585 static inline void mjpeg_encode_dc(MpegEncContext *s, int val,
586 uint8_t *huff_size, uint16_t *huff_code)
591 put_bits(&s->pb, huff_size[0], huff_code[0]);
599 nbits= av_log2_16bit(val) + 1;
601 put_bits(&s->pb, huff_size[nbits], huff_code[nbits]);
603 put_bits(&s->pb, nbits, mant & ((1 << nbits) - 1));
/* Entropy-codes block number n of the current macroblock.
 * Blocks 0..3 map to component 0; block n >= 4 maps to component n - 3.
 * The DC coefficient is coded as the difference to s->last_dc[component],
 * which is then updated. Either the luminance or the chrominance tables
 * are selected for the DC and AC coefficients.
 * NOTE(review): the condition choosing between the two table sets is not
 * visible here.
 * AC coefficients 1..s->block_last_index[n] are visited through
 * s->intra_scantable.permutated. Each coded coefficient emits the symbol
 * (run << 4) | nbits followed by nbits mantissa bits; symbol 0xf0 is
 * emitted separately, and symbol 0 (end of block) is written at the end
 * unless all 64 positions were coded. */
607 static void encode_block(MpegEncContext *s, DCTELEM *block, int n)
609 int mant, nbits, code, i, j;
610 int component, dc, run, last_index, val;
611 MJpegContext *m = s->mjpeg_ctx;
612 uint8_t *huff_size_ac;
613 uint16_t *huff_code_ac;
616 component = (n <= 3 ? 0 : n - 4 + 1);
617 dc = block[0]; /* overflow is impossible */
618 val = dc - s->last_dc[component];
620 mjpeg_encode_dc(s, val, m->huff_size_dc_luminance, m->huff_code_dc_luminance);
621 huff_size_ac = m->huff_size_ac_luminance;
622 huff_code_ac = m->huff_code_ac_luminance;
624 mjpeg_encode_dc(s, val, m->huff_size_dc_chrominance, m->huff_code_dc_chrominance);
625 huff_size_ac = m->huff_size_ac_chrominance;
626 huff_code_ac = m->huff_code_ac_chrominance;
628 s->last_dc[component] = dc;
633 last_index = s->block_last_index[n];
634 for(i=1;i<=last_index;i++) {
635 j = s->intra_scantable.permutated[i];
641 put_bits(&s->pb, huff_size_ac[0xf0], huff_code_ac[0xf0]); // NOTE(review): presumably the 16-zero run symbol for runs longer than 15 -- confirm
650 nbits= av_log2(val) + 1;
651 code = (run << 4) | nbits;
653 put_bits(&s->pb, huff_size_ac[code], huff_code_ac[code]);
655 put_bits(&s->pb, nbits, mant & ((1 << nbits) - 1));
660 /* output EOB only if not already 64 values */
661 if (last_index < 63 || run != 0)
662 put_bits(&s->pb, huff_size_ac[0], huff_code_ac[0]);
/* Encodes one macroblock by passing block[i] and its index i to
 * encode_block().
 * NOTE(review): the loop bounds are not visible here; the parameter type
 * allows up to 6 blocks -- confirm how many are coded. */
665 void mjpeg_encode_mb(MpegEncContext *s,
666 DCTELEM block[6][64])
670 encode_block(s, block[i], i);
/* Encodes one frame losslessly into buf (at most buf_size bytes) and
 * returns the number of bytes written (pbBufPtr(&s->pb) - s->pb.buf).
 *
 * After the picture header, s->header_bits records where the
 * entropy-coded data starts. Two paths follow:
 *  - PIX_FMT_RGBA32: each line is converted into three 9-bit values per
 *    pixel in `buffer` (two colour differences offset by 0x100 and a
 *    weighted sum (a + 2*b + c) >> 2 of the first three bytes of each
 *    pixel), predicted with PREDICT, and the difference wrapped into
 *    -0x100..0xFF is coded with mjpeg_encode_dc(). The first line always
 *    uses predictor 1 (left).
 *  - otherwise (planar input): samples are visited macroblock by
 *    macroblock using the per-component h/v sampling factors, and the
 *    8-bit difference (int8_t)(*ptr - pred) is coded. Macroblocks in the
 *    first row or column take a separate branch.
 * Before each line / macroblock row the remaining buffer space is checked
 * and "encoded frame too large" is logged when it is insufficient.
 * NOTE(review): what happens after that log call (presumably an error
 * return) is not visible here. */
674 static int encode_picture_lossless(AVCodecContext *avctx, unsigned char *buf, int buf_size, void *data){
675 MpegEncContext * const s = avctx->priv_data;
676 MJpegContext * const m = s->mjpeg_ctx;
677 AVFrame *pict = data;
678 const int width= s->width;
679 const int height= s->height;
680 AVFrame * const p= (AVFrame*)&s->current_picture;
681 const int predictor= avctx->prediction_method+1;
683 init_put_bits(&s->pb, buf, buf_size);
686 p->pict_type= FF_I_TYPE;
689 mjpeg_picture_header(s);
691 s->header_bits= put_bits_count(&s->pb);
693 if(avctx->pix_fmt == PIX_FMT_RGBA32){
695 const int linesize= p->linesize[0];
696 uint16_t (*buffer)[4]= (void *) s->rd_scratchpad;
697 int left[3], top[3], topleft[3];
700 buffer[0][i]= 1 << (9 - 1); // mid value of the 9-bit range
703 for(y = 0; y < height; y++) {
704 const int modified_predictor= y ? predictor : 1;
705 uint8_t *ptr = p->data[0] + (linesize * y);
707 if(s->pb.buf_end - s->pb.buf - (put_bits_count(&s->pb)>>3) < width*3*4){
708 av_log(s->avctx, AV_LOG_ERROR, "encoded frame too large\n");
713 top[i]= left[i]= topleft[i]= buffer[0][i];
715 for(x = 0; x < width; x++) {
716 buffer[x][1] = ptr[4*x+0] - ptr[4*x+1] + 0x100;
717 buffer[x][2] = ptr[4*x+2] - ptr[4*x+1] + 0x100;
718 buffer[x][0] = (ptr[4*x+0] + 2*ptr[4*x+1] + ptr[4*x+2])>>2;
723 PREDICT(pred, topleft[i], top[i], left[i], modified_predictor);
726 top[i]= buffer[x+1][i];
728 left[i]= buffer[x][i];
730 diff= ((left[i] - pred + 0x100)&0x1FF) - 0x100;
733 mjpeg_encode_dc(s, diff, m->huff_size_dc_luminance, m->huff_code_dc_luminance); //FIXME ugly
735 mjpeg_encode_dc(s, diff, m->huff_size_dc_chrominance, m->huff_code_dc_chrominance);
741 const int mb_width = (width + s->mjpeg_hsample[0] - 1) / s->mjpeg_hsample[0];
742 const int mb_height = (height + s->mjpeg_vsample[0] - 1) / s->mjpeg_vsample[0];
744 for(mb_y = 0; mb_y < mb_height; mb_y++) {
745 if(s->pb.buf_end - s->pb.buf - (put_bits_count(&s->pb)>>3) < mb_width * 4 * 3 * s->mjpeg_hsample[0] * s->mjpeg_vsample[0]){
746 av_log(s->avctx, AV_LOG_ERROR, "encoded frame too large\n");
749 for(mb_x = 0; mb_x < mb_width; mb_x++) {
750 if(mb_x==0 || mb_y==0){
753 int x, y, h, v, linesize;
754 h = s->mjpeg_hsample[i];
755 v = s->mjpeg_vsample[i];
756 linesize= p->linesize[i];
762 ptr = p->data[i] + (linesize * (v * mb_y + y)) + (h * mb_x + x); //FIXME optimize this crap
771 pred= ptr[-linesize];
773 PREDICT(pred, ptr[-linesize-1], ptr[-linesize], ptr[-1], predictor);
778 mjpeg_encode_dc(s, (int8_t)(*ptr - pred), m->huff_size_dc_luminance, m->huff_code_dc_luminance); //FIXME ugly
780 mjpeg_encode_dc(s, (int8_t)(*ptr - pred), m->huff_size_dc_chrominance, m->huff_code_dc_chrominance);
787 int x, y, h, v, linesize;
788 h = s->mjpeg_hsample[i];
789 v = s->mjpeg_vsample[i];
790 linesize= p->linesize[i];
796 ptr = p->data[i] + (linesize * (v * mb_y + y)) + (h * mb_x + x); //FIXME optimize this crap
797 //printf("%d %d %d %d %8X\n", mb_x, mb_y, x, y, ptr);
798 PREDICT(pred, ptr[-linesize-1], ptr[-linesize], ptr[-1], predictor);
801 mjpeg_encode_dc(s, (int8_t)(*ptr - pred), m->huff_size_dc_luminance, m->huff_code_dc_luminance); //FIXME ugly
803 mjpeg_encode_dc(s, (int8_t)(*ptr - pred), m->huff_size_dc_chrominance, m->huff_code_dc_chrominance);
814 mjpeg_picture_trailer(s);
817 flush_put_bits(&s->pb);
818 return pbBufPtr(&s->pb) - s->pb.buf;
819 // return (put_bits_count(&f->pb)+7)/8;
822 #endif //CONFIG_ENCODERS
824 /******************************************/
/* Upper bound on the component count accepted by mjpeg_decode_sof(), and
 * the size of the per-component arrays in MJpegDecodeContext. */
827 #define MAX_COMPONENTS 4
/* Decoder state: table data parsed from DQT/DHT segments, the frame
 * geometry and per-component parameters parsed by mjpeg_decode_sof(),
 * the picture being decoded, and restart-interval bookkeeping. */
829 typedef struct MJpegDecodeContext {
830 AVCodecContext *avctx;
832 int mpeg_enc_ctx_allocated; /* true if decoding context allocated */
834 int start_code; /* current start code */
838 int16_t quant_matrixes[4][64];
840 int qscale[4]; ///< quantizer scale calculated from quant_matrixes
842 int org_height; /* size given at codec init */
843 int first_picture; /* true if decoding first picture */
844 int interlaced; /* true if interlaced */
845 int bottom_field; /* true if bottom field */
849 int rct; /* standard rct */
850 int pegasus_rct; /* pegasus reversible colorspace transform */
851 int bits; /* bits per component */
854 int near; ///< near lossless bound (is 0 for lossless)
856 int reset; ///< context halving interval ?rename
859 int mb_width, mb_height;
861 int component_id[MAX_COMPONENTS];
862 int h_count[MAX_COMPONENTS]; /* horizontal and vertical count for each component */
863 int v_count[MAX_COMPONENTS];
864 int comp_index[MAX_COMPONENTS];
865 int dc_index[MAX_COMPONENTS];
866 int ac_index[MAX_COMPONENTS];
867 int nb_blocks[MAX_COMPONENTS];
868 int h_scount[MAX_COMPONENTS];
869 int v_scount[MAX_COMPONENTS];
870 int h_max, v_max; /* maximum h and v counts */
871 int quant_index[4]; /* quant table index for each component */
872 int last_dc[MAX_COMPONENTS]; /* last DEQUANTIZED dc (XXX: am I right to do that ?) */
873 AVFrame picture; /* picture structure */
874 int linesize[MAX_COMPONENTS]; ///< linesize << interlaced
875 int8_t *qscale_table;
876 DCTELEM block[64] __align8;
878 void (*idct_put)(uint8_t *dest/*align 8*/, int line_size, DCTELEM *block/*align 16*/);
880 int restart_interval;
885 int interlace_polarity;
888 } MJpegDecodeContext;
890 #include "jpeg_ls.c" //FIXME make jpeg-ls more independent
/* Forward declaration; the definition appears further down in this file. */
892 static int mjpeg_decode_dht(MJpegDecodeContext *s);
/* Builds a VLC decoding table from a bits_table / val_table pair.
 * The pair is expanded into per-symbol size and code arrays (256 entries
 * each, sizes zeroed first) by build_huffman_codes(); the first nb_codes
 * entries are then handed to init_vlc() with 9 as its second argument,
 * the same value the get_vlc2() calls in this file pass.
 * Returns the result of init_vlc(). */
894 static int build_vlc(VLC *vlc, const uint8_t *bits_table, const uint8_t *val_table,
895 int nb_codes, int use_static)
897 uint8_t huff_size[256];
898 uint16_t huff_code[256];
900 memset(huff_size, 0, sizeof(huff_size));
901 build_huffman_codes(huff_size, huff_code, bits_table, val_table);
903 return init_vlc(vlc, 9, nb_codes, huff_size, 1, 1, huff_code, 2, 2, use_static);
/* Decoder initialisation.
 * Zeroes the private context, takes the IDCT function and the intra scan
 * table from a temporary MpegEncContext (s2) set up with dsputil_init()
 * and DCT_common_init(), records the coded height given at init time, and
 * builds the four default VLC tables from the standard Huffman tables
 * (12 codes for the DC tables, 251 for the AC tables).
 * With CODEC_FLAG_EXTERN_HUFF a bit reader is opened over
 * avctx->extradata.
 * NOTE(review): the call that consumes that reader is not visible here;
 * presumably mjpeg_decode_dht(), whose result the existing comment says
 * is not checked -- confirm. */
906 static int mjpeg_decode_init(AVCodecContext *avctx)
908 MJpegDecodeContext *s = avctx->priv_data;
910 memset(s, 0, sizeof(MJpegDecodeContext));
914 /* ugly way to get the idct & scantable FIXME */
915 memset(&s2, 0, sizeof(MpegEncContext));
917 // s2->out_format = FMT_MJPEG;
918 dsputil_init(&s2.dsp, avctx);
919 DCT_common_init(&s2);
921 s->scantable= s2.intra_scantable;
922 s->idct_put= s2.dsp.idct_put;
924 s->mpeg_enc_ctx_allocated = 0;
928 s->first_picture = 1;
929 s->org_height = avctx->coded_height;
931 build_vlc(&s->vlcs[0][0], bits_dc_luminance, val_dc_luminance, 12, 0);
932 build_vlc(&s->vlcs[0][1], bits_dc_chrominance, val_dc_chrominance, 12, 0);
933 build_vlc(&s->vlcs[1][0], bits_ac_luminance, val_ac_luminance, 251, 0);
934 build_vlc(&s->vlcs[1][1], bits_ac_chrominance, val_ac_chrominance, 251, 0);
936 if (avctx->flags & CODEC_FLAG_EXTERN_HUFF)
938 av_log(avctx, AV_LOG_INFO, "mjpeg: using external huffman table\n");
939 init_get_bits(&s->gb, avctx->extradata, avctx->extradata_size*8);
941 /* should check for error - but dunno */
949 * finds the end of the current frame in the bitstream.
950 * @return the position of the first byte of the next frame, or END_NOT_FOUND
/* Scans buf byte by byte, shifting each byte into a rolling `state`
 * word, in two passes: one entered with the saved
 * pc->frame_start_found flag, and a second that continues from the same
 * index and clears pc->frame_start_found.
 * When the buffer is exhausted the flag is written back to pc and
 * END_NOT_FOUND is returned.
 * NOTE(review): the patterns compared against `state` and the successful
 * return are not visible here. */
952 static int find_frame_end(ParseContext *pc, const uint8_t *buf, int buf_size){
956 vop_found= pc->frame_start_found;
961 for(i=0; i<buf_size; i++){
962 state= (state<<8) | buf[i];
972 /* EOF considered as end of frame */
975 for(; i<buf_size; i++){
976 state= (state<<8) | buf[i];
978 pc->frame_start_found=0;
984 pc->frame_start_found= vop_found;
986 return END_NOT_FOUND;
/* Parser entry point: locates the end of the current frame with
 * find_frame_end(), lets ff_combine_frame() assemble the data (it may
 * replace buf and buf_size), and on the visible success path reports the
 * resulting buffer through *poutbuf and *poutbuf_size.
 * NOTE(review): the handling of a negative ff_combine_frame() result and
 * the return value are not visible here. */
989 static int jpeg_parse(AVCodecParserContext *s,
990 AVCodecContext *avctx,
991 uint8_t **poutbuf, int *poutbuf_size,
992 const uint8_t *buf, int buf_size)
994 ParseContext *pc = s->priv_data;
997 next= find_frame_end(pc, buf, buf_size);
999 if (ff_combine_frame(pc, next, (uint8_t **)&buf, &buf_size) < 0) {
1005 *poutbuf = (uint8_t *)buf;
1006 *poutbuf_size = buf_size;
1010 /* quantize tables */
/* Parses a quantization-table segment from s->gb.
 * After the 16-bit length (the 2 length bytes are subtracted) each table
 * starts with a 4-bit precision field, which must be 0 (8 bit), and a
 * 4-bit table index. The 8-bit entries are stored in
 * s->quant_matrixes[index] at the positions given by
 * s->scantable.permutated. s->qscale[index] is then set to half of the
 * larger of the entries at scan positions 1 and 8.
 * NOTE(review): a range check on `index` (quant_matrixes has 4 rows and
 * the field can hold 0..15) is not visible here -- confirm it exists. */
1011 static int mjpeg_decode_dqt(MJpegDecodeContext *s)
1013 int len, index, i, j;
1015 len = get_bits(&s->gb, 16) - 2;
1018 /* only 8 bit precision handled */
1019 if (get_bits(&s->gb, 4) != 0)
1021 dprintf("dqt: 16bit precision\n");
1024 index = get_bits(&s->gb, 4);
1027 dprintf("index=%d\n", index);
1028 /* read quant table */
1030 j = s->scantable.permutated[i];
1031 s->quant_matrixes[index][j] = get_bits(&s->gb, 8);
1034 //XXX FIXME finetune, and perhaps add dc too
1035 s->qscale[index]= FFMAX(
1036 s->quant_matrixes[index][s->scantable.permutated[1]],
1037 s->quant_matrixes[index][s->scantable.permutated[8]]) >> 1;
1038 dprintf("qscale[%d]: %d\n", index, s->qscale[index]);
1045 /* decode huffman tables and build VLC decoders */
/* Parses a Huffman-table segment from s->gb.
 * Each table has a 4-bit class and a 4-bit index, 16 count bytes read
 * into bits_table[1..16], and then the symbol values. A table is
 * rejected when the remaining length is smaller than the symbol count n
 * or n exceeds 256. The previous VLC at s->vlcs[class][index] is freed
 * and a new one is built with code_max + 1 codes; a negative build_vlc()
 * result is handled as an error.
 * NOTE(review): range checks on `class` and `index` before they index
 * s->vlcs are not visible here -- confirm they exist. */
1046 static int mjpeg_decode_dht(MJpegDecodeContext *s)
1048 int len, index, i, class, n, v, code_max;
1049 uint8_t bits_table[17];
1050 uint8_t val_table[256];
1052 len = get_bits(&s->gb, 16) - 2;
1057 class = get_bits(&s->gb, 4);
1060 index = get_bits(&s->gb, 4);
1064 for(i=1;i<=16;i++) {
1065 bits_table[i] = get_bits(&s->gb, 8);
1069 if (len < n || n > 256)
1074 v = get_bits(&s->gb, 8);
1081 /* build VLC and flush previous vlc if present */
1082 free_vlc(&s->vlcs[class][index]);
1083 dprintf("class=%d index=%d nb_codes=%d\n",
1084 class, index, code_max + 1);
1085 if(build_vlc(&s->vlcs[class][index], bits_table, val_table, code_max + 1, 0) < 0){
/* Parses a start-of-frame segment and prepares the output picture.
 *
 * Reads the segment length, bits per component, height, width and the
 * component count (must be 1..MAX_COMPONENTS). For each component it
 * reads the id (stored minus 1), the 4-bit horizontal and vertical
 * counts, and the quantization table index (values >= 4 are rejected),
 * tracking the maxima in s->h_max / s->v_max. Only 8 bits per component
 * are accepted unless s->lossless is set; 9 bits selects the RCT unless
 * pegasus_rct is active.
 *
 * When the size differs from the stored one, qscale_table is reallocated
 * and the codec dimensions updated. On the first picture, a height below
 * 3/4 of the height given at init is treated as interlaced input and
 * avctx->height is doubled.
 *
 * The pixel format is chosen from the sampling counts of component 0,
 * the rgb flag, the component count and cs_itu601. A new picture buffer
 * is then requested, any previous one being released first. Finally the
 * length field is checked against 8 + 3 * nb_components.
 * NOTE(review): the results of the error branches (presumably -1) are
 * not visible here.
 * NOTE(review): the av_mallocz() result for qscale_table is not checked
 * in the visible lines. */
1092 static int mjpeg_decode_sof(MJpegDecodeContext *s)
1094 int len, nb_components, i, width, height;
1096 /* XXX: verify len field validity */
1097 len = get_bits(&s->gb, 16);
1098 s->bits= get_bits(&s->gb, 8);
1100 if(s->pegasus_rct) s->bits=9;
1101 if(s->bits==9 && !s->pegasus_rct) s->rct=1; //FIXME ugly
1103 if (s->bits != 8 && !s->lossless){
1104 av_log(s->avctx, AV_LOG_ERROR, "only 8 bits/component accepted\n");
1107 height = get_bits(&s->gb, 16);
1108 width = get_bits(&s->gb, 16);
1110 dprintf("sof0: picture: %dx%d\n", width, height);
1111 if(avcodec_check_dimensions(s->avctx, width, height))
1114 nb_components = get_bits(&s->gb, 8);
1115 if (nb_components <= 0 ||
1116 nb_components > MAX_COMPONENTS)
1118 s->nb_components = nb_components;
1121 for(i=0;i<nb_components;i++) {
1123 s->component_id[i] = get_bits(&s->gb, 8) - 1;
1124 s->h_count[i] = get_bits(&s->gb, 4);
1125 s->v_count[i] = get_bits(&s->gb, 4);
1126 /* compute hmax and vmax (only used in interleaved case) */
1127 if (s->h_count[i] > s->h_max)
1128 s->h_max = s->h_count[i];
1129 if (s->v_count[i] > s->v_max)
1130 s->v_max = s->v_count[i];
1131 s->quant_index[i] = get_bits(&s->gb, 8);
1132 if (s->quant_index[i] >= 4)
1134 dprintf("component %d %d:%d id: %d quant:%d\n", i, s->h_count[i],
1135 s->v_count[i], s->component_id[i], s->quant_index[i]);
1138 if(s->v_max==1 && s->h_max==1 && s->lossless==1) s->rgb=1;
1140 /* if different size, realloc/alloc picture */
1141 /* XXX: also check h_count and v_count */
1142 if (width != s->width || height != s->height) {
1143 av_freep(&s->qscale_table);
1147 avcodec_set_dimensions(s->avctx, width, height);
1149 /* test interlaced mode */
1150 if (s->first_picture &&
1151 s->org_height != 0 &&
1152 s->height < ((s->org_height * 3) / 4)) {
1154 // s->bottom_field = (s->interlace_polarity) ? 1 : 0;
1155 s->bottom_field = 0;
1156 s->avctx->height *= 2;
1159 s->qscale_table= av_mallocz((s->width+15)/16);
1161 s->first_picture = 0;
1164 if(s->interlaced && s->bottom_field)
1167 /* XXX: not complete test ! */
1168 switch((s->h_count[0] << 4) | s->v_count[0]) {
1171 s->avctx->pix_fmt = PIX_FMT_RGBA32;
1172 }else if(s->nb_components==3)
1173 s->avctx->pix_fmt = s->cs_itu601 ? PIX_FMT_YUV444P : PIX_FMT_YUVJ444P;
1175 s->avctx->pix_fmt = PIX_FMT_GRAY8;
1178 s->avctx->pix_fmt = s->cs_itu601 ? PIX_FMT_YUV422P : PIX_FMT_YUVJ422P;
1182 s->avctx->pix_fmt = s->cs_itu601 ? PIX_FMT_YUV420P : PIX_FMT_YUVJ420P;
1186 if(s->picture.data[0])
1187 s->avctx->release_buffer(s->avctx, &s->picture);
1189 s->picture.reference= 0;
1190 if(s->avctx->get_buffer(s->avctx, &s->picture) < 0){
1191 av_log(s->avctx, AV_LOG_ERROR, "get_buffer() failed\n");
1194 s->picture.pict_type= I_TYPE;
1195 s->picture.key_frame= 1;
1198 s->linesize[i]= s->picture.linesize[i] << s->interlaced;
1201 // printf("%d %d %d %d %d %d\n", s->width, s->height, s->linesize[0], s->linesize[1], s->interlaced, s->avctx->height);
1203 if (len != (8+(3*nb_components)))
1205 dprintf("decode_sof0: error, len(%d) mismatch\n", len);
/* Decodes one DC / lossless difference value: reads a Huffman code from
 * DC table dc_index with get_vlc2(), then returns get_xbits() of that
 * many bits.
 * NOTE(review): the failure path logs "bad vlc"; decode_block() treats a
 * result of 0xffff as the error value, so that is presumably what is
 * returned there -- confirm. */
1211 static inline int mjpeg_decode_dc(MJpegDecodeContext *s, int dc_index)
1214 code = get_vlc2(&s->gb, s->vlcs[0][dc_index].table, 9, 2);
1217 dprintf("mjpeg_decode_dc: bad vlc: %d:%d (%p)\n", 0, dc_index,
1218 &s->vlcs[0][dc_index]);
1223 return get_xbits(&s->gb, code);
1228 /* decode block and dequantize */
/* Decodes one block of coefficients into `block`.
 * The DC difference is scaled by quant_matrix[0] and added to
 * s->last_dc[component], which therefore holds the dequantized DC; the
 * sum is stored back. A DC result of 0xffff is treated as an error.
 * AC symbols are read from AC table ac_index. The low 4 bits of a symbol
 * give the number of extra bits read with get_xbits(); the level is
 * stored at scan position s->scantable.permutated[i], multiplied by the
 * matching quant_matrix entry.
 * NOTE(review): run handling, the end-of-block test and the return values
 * are not visible here; mjpeg_decode_scan() treats a negative result as
 * failure. */
1229 static int decode_block(MJpegDecodeContext *s, DCTELEM *block,
1230 int component, int dc_index, int ac_index, int quant_index)
1232 int code, i, j, level, val;
1234 int16_t *quant_matrix;
1237 val = mjpeg_decode_dc(s, dc_index);
1238 if (val == 0xffff) {
1239 dprintf("error dc\n");
1242 quant_matrix = s->quant_matrixes[quant_index];
1243 val = val * quant_matrix[0] + s->last_dc[component];
1244 s->last_dc[component] = val;
1247 ac_vlc = &s->vlcs[1][ac_index];
1250 code = get_vlc2(&s->gb, s->vlcs[1][ac_index].table, 9, 2);
1253 dprintf("error ac\n");
1262 level = get_xbits(&s->gb, code & 0xf);
1265 dprintf("error count: %d\n", i);
1268 j = s->scantable.permutated[i];
1269 block[j] = level * quant_matrix[j];
/* Decodes a lossless scan into a packed 4-bytes-per-pixel picture.
 * Each line is decoded into `buffer` (three values per pixel, masked to
 * s->bits bits): PREDICT yields the prediction and the decoded
 * difference, shifted left by point_transform, is added. The first line
 * always uses predictor 1 (left). The line is then written out in one of
 * three ways: with the reverse colour transform using a 0x200 offset,
 * with the pegasus variant that has no offset, or by copying the three
 * values unchanged.
 * Restart intervals are counted per pixel; when the counter reaches 0
 * the bit reader is byte aligned and 16 bits (the RSTn marker) are
 * skipped.
 * NOTE(review): `buffer` is a 32768 x 4 array of uint16_t (256 KiB) with
 * automatic storage, which is large for a stack object; widths above
 * 32768 are caught by the check on s->mb_width. */
1278 static int ljpeg_decode_rgb_scan(MJpegDecodeContext *s, int predictor, int point_transform){
1280 uint16_t buffer[32768][4];
1281 int left[3], top[3], topleft[3];
1282 const int linesize= s->linesize[0];
1283 const int mask= (1<<s->bits)-1;
1285 if((unsigned)s->mb_width > 32768) //dynamic alloc
1289 buffer[0][i]= 1 << (s->bits + point_transform - 1);
1291 for(mb_y = 0; mb_y < s->mb_height; mb_y++) {
1292 const int modified_predictor= mb_y ? predictor : 1;
1293 uint8_t *ptr = s->picture.data[0] + (linesize * mb_y);
1295 if (s->interlaced && s->bottom_field)
1296 ptr += linesize >> 1;
1299 top[i]= left[i]= topleft[i]= buffer[0][i];
1301 for(mb_x = 0; mb_x < s->mb_width; mb_x++) {
1302 if (s->restart_interval && !s->restart_count)
1303 s->restart_count = s->restart_interval;
1309 top[i]= buffer[mb_x][i];
1311 PREDICT(pred, topleft[i], top[i], left[i], modified_predictor);
1314 buffer[mb_x][i]= mask & (pred + (mjpeg_decode_dc(s, s->dc_index[i]) << point_transform));
1317 if (s->restart_interval && !--s->restart_count) {
1318 align_get_bits(&s->gb);
1319 skip_bits(&s->gb, 16); /* skip RSTn */
1324 for(mb_x = 0; mb_x < s->mb_width; mb_x++) {
1325 ptr[4*mb_x+1] = buffer[mb_x][0] - ((buffer[mb_x][1] + buffer[mb_x][2] - 0x200)>>2);
1326 ptr[4*mb_x+0] = buffer[mb_x][1] + ptr[4*mb_x+1];
1327 ptr[4*mb_x+2] = buffer[mb_x][2] + ptr[4*mb_x+1];
1329 }else if(s->pegasus_rct){
1330 for(mb_x = 0; mb_x < s->mb_width; mb_x++) {
1331 ptr[4*mb_x+1] = buffer[mb_x][0] - ((buffer[mb_x][1] + buffer[mb_x][2])>>2);
1332 ptr[4*mb_x+0] = buffer[mb_x][1] + ptr[4*mb_x+1];
1333 ptr[4*mb_x+2] = buffer[mb_x][2] + ptr[4*mb_x+1];
1336 for(mb_x = 0; mb_x < s->mb_width; mb_x++) {
1337 ptr[4*mb_x+0] = buffer[mb_x][0];
1338 ptr[4*mb_x+1] = buffer[mb_x][1];
1339 ptr[4*mb_x+2] = buffer[mb_x][2];
/* Decodes a lossless scan into planar pictures, one sample at a time.
 * The component count is fixed at 3. Each sample is written as the
 * prediction plus the decoded difference shifted left by point_transform.
 * Macroblocks in the first row or column, and all macroblocks of
 * interlaced input, take a branch that special-cases the picture edges
 * (128 << point_transform for the very first sample, the sample above
 * for the first column); all others use PREDICT directly.
 * After each macroblock the restart counter is decremented; when it
 * reaches 0 the bit reader is byte aligned and the 16-bit RSTn marker is
 * skipped.
 * NOTE(review): the initialisation of h, v, x and y from the component
 * parameters is not visible here. */
1346 static int ljpeg_decode_yuv_scan(MJpegDecodeContext *s, int predictor, int point_transform){
1348 const int nb_components=3;
1350 for(mb_y = 0; mb_y < s->mb_height; mb_y++) {
1351 for(mb_x = 0; mb_x < s->mb_width; mb_x++) {
1352 if (s->restart_interval && !s->restart_count)
1353 s->restart_count = s->restart_interval;
1355 if(mb_x==0 || mb_y==0 || s->interlaced){
1356 for(i=0;i<nb_components;i++) {
1358 int n, h, v, x, y, c, j, linesize;
1359 n = s->nb_blocks[i];
1360 c = s->comp_index[i];
1365 linesize= s->linesize[c];
1367 for(j=0; j<n; j++) {
1370 ptr = s->picture.data[c] + (linesize * (v * mb_y + y)) + (h * mb_x + x); //FIXME optimize this crap
1371 if(y==0 && mb_y==0){
1372 if(x==0 && mb_x==0){
1373 pred= 128 << point_transform;
1378 if(x==0 && mb_x==0){
1379 pred= ptr[-linesize];
1381 PREDICT(pred, ptr[-linesize-1], ptr[-linesize], ptr[-1], predictor);
1385 if (s->interlaced && s->bottom_field)
1386 ptr += linesize >> 1;
1387 *ptr= pred + (mjpeg_decode_dc(s, s->dc_index[i]) << point_transform);
1396 for(i=0;i<nb_components;i++) {
1398 int n, h, v, x, y, c, j, linesize;
1399 n = s->nb_blocks[i];
1400 c = s->comp_index[i];
1405 linesize= s->linesize[c];
1407 for(j=0; j<n; j++) {
1410 ptr = s->picture.data[c] + (linesize * (v * mb_y + y)) + (h * mb_x + x); //FIXME optimize this crap
1411 PREDICT(pred, ptr[-linesize-1], ptr[-linesize], ptr[-1], predictor);
1412 *ptr= pred + (mjpeg_decode_dc(s, s->dc_index[i]) << point_transform);
1420 if (s->restart_interval && !--s->restart_count) {
1421 align_get_bits(&s->gb);
1422 skip_bits(&s->gb, 16); /* skip RSTn */
/*
 * Decode one DCT-based scan of three components (nb_components is fixed to 3
 * below).  For every MCU position and component, each block is decoded with
 * decode_block() into s->block and written to s->picture through
 * s->idct_put().
 *
 * NOTE(review): the return statements are not visible in this excerpt; the
 * caller in mjpeg_decode_sos() treats a negative result as failure.
 */
1429 static int mjpeg_decode_scan(MJpegDecodeContext *s){
1431 const int nb_components=3;
1433 for(mb_y = 0; mb_y < s->mb_height; mb_y++) {
1434 for(mb_x = 0; mb_x < s->mb_width; mb_x++) {
/* re-arm the restart counter once it has reached zero */
1435 if (s->restart_interval && !s->restart_count)
1436 s->restart_count = s->restart_interval;
1438 for(i=0;i<nb_components;i++) {
1440 int n, h, v, x, y, c, j;
1441 n = s->nb_blocks[i];
1442 c = s->comp_index[i];
/* start every block from all-zero coefficients */
1448 memset(s->block, 0, sizeof(s->block));
1449 if (decode_block(s, s->block, i,
1450 s->dc_index[i], s->ac_index[i],
1451 s->quant_index[c]) < 0) {
1452 dprintf("error y=%d x=%d\n", mb_y, mb_x);
1455 // dprintf("mb: %d %d processed\n", mb_y, mb_x);
/* destination of this block: positions advance in steps of 8 samples and
   the resulting offset is scaled down by avctx->lowres */
1456 ptr = s->picture.data[c] +
1457 (((s->linesize[c] * (v * mb_y + y) * 8) +
1458 (h * mb_x + x) * 8) >> s->avctx->lowres);
1459 if (s->interlaced && s->bottom_field)
1460 ptr += s->linesize[c] >> 1;
1461 //av_log(NULL, AV_LOG_DEBUG, "%d %d %d %d %d %d %d %d \n", mb_x, mb_y, x, y, c, s->bottom_field, (v * mb_y + y) * 8, (h * mb_x + x) * 8);
1462 s->idct_put(ptr, s->linesize[c], s->block);
/* restart markers are only honoured for intervals below 1350 */
1469 /* (< 1350) buggy workaround for Spectralfan.mov, should be fixed */
1470 if (s->restart_interval && (s->restart_interval < 1350) &&
1471 !--s->restart_count) {
1472 align_get_bits(&s->gb);
1473 skip_bits(&s->gb, 16); /* skip RSTn */
1474 for (i=0; i<nb_components; i++) /* reset dc */
1475 s->last_dc[i] = 1024;
/*
 * Parse a start-of-scan (SOS) header and decode the scan that follows it.
 *
 * Steps visible here:
 *  - read the 16-bit segment length and the component count, and check that
 *    length == 6 + 2 * nb_components and that the count equals
 *    s->nb_components;
 *  - for each scan component, look up its index in s->component_id[], copy
 *    the sampling counts into s->nb_blocks / s->h_scount / s->v_scount and
 *    read the 4-bit DC and AC table selectors;
 *  - read the predictor (Ss), ilv (Se) and point transform (Al) fields;
 *  - reset s->last_dc[] to 1024 and compute s->mb_width / s->mb_height;
 *  - skip s->mjpb_skiptosod padding bytes;
 *  - hand over to ljpeg_decode_rgb_scan(), ljpeg_decode_yuv_scan() or
 *    mjpeg_decode_scan().
 *
 * NOTE(review): the component id is read as "value - 1" before it is
 * compared with s->component_id[]; confirm the SOF parser stores ids with the
 * same offset.
 * NOTE(review): the switch on s->start_code tests dc_index[i]/ac_index[i]
 * without "s->"; presumably that region is compiled out, but the
 * preprocessor lines are not visible in this excerpt -- verify.
 * NOTE(review): return statements are not visible here.
 */
1482 static int mjpeg_decode_sos(MJpegDecodeContext *s)
1484 int len, nb_components, i, h, v, predictor, point_transform;
1485 int vmax, hmax, index, id;
/* lossless scans work on single samples, DCT scans on 8-sample blocks */
1486 const int block_size= s->lossless ? 1 : 8;
1489 /* XXX: verify len field validity */
1490 len = get_bits(&s->gb, 16);
1491 nb_components = get_bits(&s->gb, 8);
1492 if (len != 6+2*nb_components)
1494 dprintf("decode_sos: invalid len (%d)\n", len);
1497 /* XXX: only interleaved scan accepted */
1498 if (nb_components != s->nb_components)
1500 dprintf("decode_sos: components(%d) mismatch\n", nb_components);
1505 for(i=0;i<nb_components;i++) {
1506 id = get_bits(&s->gb, 8) - 1;
1507 dprintf("component: %d\n", id);
1508 /* find component index */
1509 for(index=0;index<s->nb_components;index++)
1510 if (id == s->component_id[index])
1512 if (index == s->nb_components)
1514 dprintf("decode_sos: index(%d) out of components\n", index);
1518 s->comp_index[i] = index;
1520 s->nb_blocks[i] = s->h_count[index] * s->v_count[index];
1521 s->h_scount[i] = s->h_count[index];
1522 s->v_scount[i] = s->v_count[index];
1524 s->dc_index[i] = get_bits(&s->gb, 4);
1525 s->ac_index[i] = get_bits(&s->gb, 4);
1527 if (s->dc_index[i] < 0 || s->ac_index[i] < 0 ||
1528 s->dc_index[i] >= 4 || s->ac_index[i] >= 4)
1531 switch(s->start_code)
1534 if (dc_index[i] > 1 || ac_index[i] > 1)
1539 if (dc_index[i] > 3 || ac_index[i] > 3)
1543 if (dc_index[i] > 3 || ac_index[i] != 0)
1550 predictor= get_bits(&s->gb, 8); /* JPEG Ss / lossless JPEG predictor /JPEG-LS NEAR */
1551 ilv= get_bits(&s->gb, 8); /* JPEG Se / JPEG-LS ILV */
1552 skip_bits(&s->gb, 4); /* Ah */
1553 point_transform= get_bits(&s->gb, 4); /* Al */
1555 for(i=0;i<nb_components;i++)
1556 s->last_dc[i] = 1024;
1558 if (nb_components > 1) {
1559 /* interleaved stream */
1560 s->mb_width = (s->width + s->h_max * block_size - 1) / (s->h_max * block_size);
1561 s->mb_height = (s->height + s->v_max * block_size - 1) / (s->v_max * block_size);
1563 h = s->h_max / s->h_scount[s->comp_index[0]];
1564 v = s->v_max / s->v_scount[s->comp_index[0]];
1565 s->mb_width = (s->width + h * block_size - 1) / (h * block_size);
1566 s->mb_height = (s->height + v * block_size - 1) / (v * block_size);
1567 s->nb_blocks[0] = 1;
1572 if(s->avctx->debug & FF_DEBUG_PICT_INFO)
1573 av_log(s->avctx, AV_LOG_DEBUG, "%s %s p:%d >>:%d ilv:%d bits:%d %s\n", s->lossless ? "lossless" : "sequencial DCT", s->rgb ? "RGB" : "",
1574 predictor, point_transform, ilv, s->bits,
1575 s->pegasus_rct ? "PRCT" : (s->rct ? "RCT" : ""));
1578 /* mjpeg-b can have padding bytes between sos and image data, skip them */
1579 for (i = s->mjpb_skiptosod; i > 0; i--)
1580 skip_bits(&s->gb, 8);
1587 if(ljpeg_decode_rgb_scan(s, predictor, point_transform) < 0)
1590 if(ljpeg_decode_yuv_scan(s, predictor, point_transform) < 0)
1595 if(mjpeg_decode_scan(s) < 0)
1601 dprintf("decode_sos: ac/dc index out of range\n");
/*
 * Parse a DRI (define restart interval) segment.
 *
 * The 16-bit length field is compared against 4, then the 16-bit restart
 * interval is stored in s->restart_interval and s->restart_count is cleared.
 * NOTE(review): return statements are not visible in this excerpt.
 */
1605 static int mjpeg_decode_dri(MJpegDecodeContext *s)
1607 if (get_bits(&s->gb, 16) != 4)
1609 s->restart_interval = get_bits(&s->gb, 16);
1610 s->restart_count = 0;
1611 dprintf("restart interval: %d\n", s->restart_interval);
/*
 * Parse an APPn segment.
 *
 * Reads the 16-bit segment length, checks that the segment fits into the
 * remaining bit buffer, then reads a 32-bit identifier and compares it with
 * the fourccs handled below:
 *   "AVI1"            - stores the interlace polarity byte,
 *   "JFIF"            - reads the version bytes and the sample aspect ratio
 *                       into s->avctx, then the thumbnail dimensions,
 *   "Adob" + 'e'      - skips version, flags and transform fields,
 *   "LJIF"            - Pegasus lossless JPEG header, switches on a
 *                       colorspace byte,
 *   "mjpg" (APP1)     - Apple MJPEG-A header, all offset fields are skipped.
 * Left-over segment bytes are skipped one at a time at the end.
 *
 * NOTE(review): the bookkeeping of `len` and the return statements are not
 * visible in this excerpt.
 */
1616 static int mjpeg_decode_app(MJpegDecodeContext *s)
1620 len = get_bits(&s->gb, 16);
1623 if(8*len + get_bits_count(&s->gb) > s->gb.size_in_bits)
1626 id = (get_bits(&s->gb, 16) << 16) | get_bits(&s->gb, 16);
1630 if(s->avctx->debug & FF_DEBUG_STARTCODE){
1631 av_log(s->avctx, AV_LOG_DEBUG, "APPx %8X\n", id);
1634 /* buggy AVID, it puts EOI only at every 10th frame */
1635 /* this fourcc is also used by non-AVID files; it holds some
1636 information, but it is always present in AVID-created files */
1637 if (id == ff_get_fourcc("AVI1"))
1644 4bytes field_size_less_padding
1647 // if (s->first_picture)
1648 // printf("mjpeg: workarounding buggy AVID\n");
1649 s->interlace_polarity = get_bits(&s->gb, 8);
1651 skip_bits(&s->gb, 8);
1652 skip_bits(&s->gb, 32);
1653 skip_bits(&s->gb, 32);
1656 // if (s->interlace_polarity)
1657 // printf("mjpeg: interlace polarity: %d\n", s->interlace_polarity);
1663 if (id == ff_get_fourcc("JFIF"))
1665 int t_w, t_h, v1, v2;
1666 skip_bits(&s->gb, 8); /* the trailing zero-byte */
1667 v1= get_bits(&s->gb, 8);
1668 v2= get_bits(&s->gb, 8);
1669 skip_bits(&s->gb, 8);
1671 s->avctx->sample_aspect_ratio.num= get_bits(&s->gb, 16);
1672 s->avctx->sample_aspect_ratio.den= get_bits(&s->gb, 16);
1674 if (s->avctx->debug & FF_DEBUG_PICT_INFO)
1675 av_log(s->avctx, AV_LOG_INFO, "mjpeg: JFIF header found (version: %x.%x) SAR=%d/%d\n",
1677 s->avctx->sample_aspect_ratio.num,
1678 s->avctx->sample_aspect_ratio.den
1681 t_w = get_bits(&s->gb, 8);
1682 t_h = get_bits(&s->gb, 8);
1685 /* skip thumbnail */
1686 if (len-10-(t_w*t_h*3) > 0)
1693 if (id == ff_get_fourcc("Adob") && (get_bits(&s->gb, 8) == 'e'))
1695 if (s->avctx->debug & FF_DEBUG_PICT_INFO)
1696 av_log(s->avctx, AV_LOG_INFO, "mjpeg: Adobe header found\n");
1697 skip_bits(&s->gb, 16); /* version */
1698 skip_bits(&s->gb, 16); /* flags0 */
1699 skip_bits(&s->gb, 16); /* flags1 */
1700 skip_bits(&s->gb, 8); /* transform */
1705 if (id == ff_get_fourcc("LJIF")){
1706 if (s->avctx->debug & FF_DEBUG_PICT_INFO)
1707 av_log(s->avctx, AV_LOG_INFO, "Pegasus lossless jpeg header found\n");
1708 skip_bits(&s->gb, 16); /* version ? */
1709 skip_bits(&s->gb, 16); /* unknown, always 0? */
1710 skip_bits(&s->gb, 16); /* unknown, always 0? */
1711 skip_bits(&s->gb, 16); /* unknown, always 0? */
1712 switch( get_bits(&s->gb, 8)){
1722 av_log(s->avctx, AV_LOG_ERROR, "unknown colorspace\n");
1729 if ((s->start_code == APP1) && (len > (0x28 - 8)))
1731 id = (get_bits(&s->gb, 16) << 16) | get_bits(&s->gb, 16);
1734 if (id == ff_get_fourcc("mjpg")) /* Apple MJPEG-A */
1737 skip_bits(&s->gb, 32); /* field size */
1738 skip_bits(&s->gb, 32); /* pad field size */
1739 skip_bits(&s->gb, 32); /* next off */
1740 skip_bits(&s->gb, 32); /* quant off */
1741 skip_bits(&s->gb, 32); /* huff off */
1742 skip_bits(&s->gb, 32); /* image off */
1743 skip_bits(&s->gb, 32); /* scan off */
1744 skip_bits(&s->gb, 32); /* data off */
1746 if (s->avctx->debug & FF_DEBUG_PICT_INFO)
1747 av_log(s->avctx, AV_LOG_INFO, "mjpeg: Apple MJPEG-A header found\n");
1752 /* slow but needed for extreme adobe jpegs */
1754 av_log(s->avctx, AV_LOG_ERROR, "mjpeg: error, decode_app parser read over the end\n");
1756 skip_bits(&s->gb, 8);
/*
 * Parse a COM (comment) segment.
 *
 * When the 16-bit length is at least 2 and the payload fits into the
 * remaining bit buffer, the len - 2 payload bytes are copied into a
 * temporary buffer of len - 1 bytes obtained from av_malloc().  The text is
 * optionally logged and then compared with two known strings:
 *   "AVID"      - buggy AVID stream (EOI only every 10th frame),
 *   "CS=ITU601" - colorspace hint.
 * NOTE(review): the assignments made for those two matches, the string
 * termination and the release of cbuf are not visible in this excerpt.
 */
1761 static int mjpeg_decode_com(MJpegDecodeContext *s)
1763 int len = get_bits(&s->gb, 16);
1764 if (len >= 2 && 8*len - 16 + get_bits_count(&s->gb) <= s->gb.size_in_bits) {
1765 uint8_t *cbuf = av_malloc(len - 1);
1768 for (i = 0; i < len - 2; i++)
1769 cbuf[i] = get_bits(&s->gb, 8);
1770 if (i > 0 && cbuf[i-1] == '\n')
1775 if(s->avctx->debug & FF_DEBUG_PICT_INFO)
1776 av_log(s->avctx, AV_LOG_INFO, "mjpeg comment: '%s'\n", cbuf);
1778 /* buggy avid, it puts EOI only at every 10th frame */
1779 if (!strcmp(cbuf, "AVID"))
1782 // if (s->first_picture)
1783 // printf("mjpeg: workarounding buggy AVID\n");
1785 else if(!strcmp(cbuf, "CS=ITU601")){
/*
 * 16 x 16 table with one entry per byte value (row = high nibble, column =
 * low nibble).  Entries 0xc0..0xfe are 1, everything else (including 0xff)
 * is 0.
 * NOTE(review): no reader of this table is visible in this excerpt;
 * find_marker() range-checks 0xc0..0xfe directly.
 */
1797 static int valid_marker_list[] =
1799 /* 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, a, b, c, d, e, f */
1800 /* 0 */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1801 /* 1 */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1802 /* 2 */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1803 /* 3 */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1804 /* 4 */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1805 /* 5 */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1806 /* 6 */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1807 /* 7 */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1808 /* 8 */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1809 /* 9 */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1810 /* a */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1811 /* b */ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1812 /* c */ 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1813 /* d */ 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1814 /* e */ 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
1815 /* f */ 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0,
1819 /* Return the 8 bit start code value and update the search
1820 state (*pbuf_ptr). Return -1 if no start code is found. */
/*
 * A marker is accepted when a 0xff byte is followed by a byte in the range
 * 0xc0..0xfe and input remains after it.  The scan position is written back
 * through pbuf_ptr before returning.
 */
1821 static int find_marker(uint8_t **pbuf_ptr, uint8_t *buf_end)
1830 buf_ptr = *pbuf_ptr;
1831 while (buf_ptr < buf_end) {
1834 if ((v == 0xff) && (v2 >= 0xc0) && (v2 <= 0xfe) && buf_ptr < buf_end) {
1845 dprintf("find_marker skipped %d bytes\n", skipped);
1847 *pbuf_ptr = buf_ptr;
/*
 * Decode one input buffer of JPEG / MJPEG data.
 *
 * The buffer is walked marker by marker with find_marker().  For an SOS
 * marker the entropy-coded data is first unescaped into s->buffer (which is
 * re-allocated when the remaining input is larger than s->buffer_size); for
 * every other marker the bit reader is set up directly on the input.  The
 * marker is then dispatched: RSTn, APPn (mjpeg_decode_app), COM
 * (mjpeg_decode_com), and a switch covering the remaining segment types.
 * When a picture is complete it is copied to *data, *data_size is set to
 * sizeof(AVFrame) and the quality fields are filled in.
 *
 * avctx     - codec context, avctx->priv_data is the MJpegDecodeContext
 * data      - AVFrame that receives the decoded picture
 * data_size - set to sizeof(AVFrame) when a picture is output
 * buf       - input bytes
 * buf_size  - number of input bytes
 *
 * The value returned at the end is the number of bytes consumed
 * (buf_ptr - buf).
 *
 * NOTE(review): the results of mjpeg_decode_app(), mjpeg_decode_com(),
 * mjpeg_decode_dqt(), mjpeg_decode_sos() and mjpeg_decode_dri() are not
 * checked in the calls visible here.
 */
1851 static int mjpeg_decode_frame(AVCodecContext *avctx,
1852 void *data, int *data_size,
1853 uint8_t *buf, int buf_size)
1855 MJpegDecodeContext *s = avctx->priv_data;
1856 uint8_t *buf_end, *buf_ptr;
1858 AVFrame *picture = data;
1861 buf_end = buf + buf_size;
1862 while (buf_ptr < buf_end) {
1863 /* find the start of the next marker */
1864 start_code = find_marker(&buf_ptr, buf_end);
1867 if (start_code < 0) {
1870 dprintf("marker=%x avail_size_in_buf=%d\n", start_code, buf_end - buf_ptr);
1872 if ((buf_end - buf_ptr) > s->buffer_size)
1875 s->buffer_size = buf_end-buf_ptr;
1876 s->buffer = av_malloc(s->buffer_size + FF_INPUT_BUFFER_PADDING_SIZE);
1877 dprintf("buffer too small, expanding to %d bytes\n",
1881 /* unescape buffer of SOS */
1882 if (start_code == SOS)
1884 uint8_t *src = buf_ptr;
1885 uint8_t *dst = s->buffer;
1889 uint8_t x = *(src++);
1894 while(src<buf_end && x == 0xff)
1897 if (x >= 0xd0 && x <= 0xd7)
1903 init_get_bits(&s->gb, s->buffer, (dst - s->buffer)*8);
1905 dprintf("escaping removed %d bytes\n",
1906 (buf_end - buf_ptr) - (dst - s->buffer));
1909 init_get_bits(&s->gb, buf_ptr, (buf_end - buf_ptr)*8);
1911 s->start_code = start_code;
1912 if(s->avctx->debug & FF_DEBUG_STARTCODE){
1913 av_log(s->avctx, AV_LOG_DEBUG, "startcode: %X\n", start_code);
1916 /* process markers */
1917 if (start_code >= 0xd0 && start_code <= 0xd7) {
1918 dprintf("restart marker: %d\n", start_code&0x0f);
1920 } else if (start_code >= APP0 && start_code <= APP15) {
1921 mjpeg_decode_app(s);
1923 } else if (start_code == COM){
1924 mjpeg_decode_com(s);
1927 switch(start_code) {
1929 s->restart_interval = 0;
1930 reset_ls_coding_parameters(s, 1);
1932 s->restart_count = 0;
1933 /* nothing to do on SOI */
1936 mjpeg_decode_dqt(s);
1939 if(mjpeg_decode_dht(s) < 0){
1940 av_log(s->avctx, AV_LOG_ERROR, "huffman table decode error\n");
1946 if (mjpeg_decode_sof(s) < 0)
1951 if (mjpeg_decode_sof(s) < 0)
1957 if (mjpeg_decode_sof(s) < 0)
1961 if (decode_lse(s) < 0)
1965 if ((s->buggy_avid && !s->interlaced) || s->restart_interval)
1969 if (s->interlaced) {
1970 s->bottom_field ^= 1;
1971 /* if not bottom field, do not output image yet */
1972 if (s->bottom_field)
1975 *picture = s->picture;
1976 *data_size = sizeof(AVFrame);
/* report the largest of the three qscale values as the picture quality */
1979 picture->quality= FFMAX(FFMAX(s->qscale[0], s->qscale[1]), s->qscale[2]);
1980 picture->qstride= 0;
1981 picture->qscale_table= s->qscale_table;
1982 memset(picture->qscale_table, picture->quality, (s->width+15)/16);
1983 if(avctx->debug & FF_DEBUG_QP)
1984 av_log(s->avctx, AV_LOG_DEBUG, "QP: %d\n", picture->quality);
1985 picture->quality*= FF_QP2LAMBDA;
1992 mjpeg_decode_sos(s);
1993 /* buggy avid puts EOI every 10-20th frame */
1994 /* if restart period is over process EOI */
1995 if ((s->buggy_avid && !s->interlaced) || s->restart_interval)
1999 mjpeg_decode_dri(s);
2013 av_log(s->avctx, AV_LOG_ERROR, "mjpeg: unsupported coding type (%x)\n", start_code);
2016 // printf("mjpeg: unsupported marker (%x)\n", start_code);
2021 /* eof process start code */
/* advance past the bytes the segment parser consumed (rounded up) */
2022 buf_ptr += (get_bits_count(&s->gb)+7)/8;
2023 dprintf("marker parser used %d bytes (%d bits)\n",
2024 (get_bits_count(&s->gb)+7)/8, get_bits_count(&s->gb));
2029 dprintf("mjpeg decode frame unused %d bytes\n", buf_end - buf_ptr);
2030 // return buf_end - buf_ptr;
2031 return buf_ptr - buf;
/*
 * Decode one Apple MJPEG-B buffer.
 *
 * Instead of markers, the input starts with a header that is read through
 * the separate bit reader `hgb`: 32 reserved bits, the "mjpg" tag, the field
 * size, the padded field size, the offset of the second field, and the
 * offsets of the DQT, DHT, SOF, SOS and SOD sections.  For each section the
 * main bit reader s->gb is pointed at buf + offset and the matching segment
 * parser is called.  For interlaced input with a second field, buf_ptr is
 * moved to buf + second_field_offs.  The finished picture is copied to *data
 * and the quality fields are filled in, the same way as on EOI in
 * mjpeg_decode_frame().
 *
 * avctx     - codec context, avctx->priv_data is the MJpegDecodeContext
 * data      - AVFrame that receives the decoded picture
 * data_size - set to sizeof(AVFrame) when a picture is output
 * buf       - input bytes
 * buf_size  - number of input bytes
 *
 * The value returned at the end is buf_ptr - buf.
 *
 * NOTE(review): the section offsets and field_size come straight from the
 * bitstream and are added to buf / passed to init_get_bits() with no bounds
 * check against buf_end visible in this excerpt -- confirm that they are
 * validated somewhere.
 * NOTE(review): the results of mjpeg_decode_dqt(), mjpeg_decode_dht() and
 * mjpeg_decode_sos() are not checked in the calls visible here.
 */
2034 static int mjpegb_decode_frame(AVCodecContext *avctx,
2035 void *data, int *data_size,
2036 uint8_t *buf, int buf_size)
2038 MJpegDecodeContext *s = avctx->priv_data;
2039 uint8_t *buf_end, *buf_ptr;
2040 AVFrame *picture = data;
2041 GetBitContext hgb; /* for the header */
2042 uint32_t dqt_offs, dht_offs, sof_offs, sos_offs, second_field_offs;
2043 uint32_t field_size, sod_offs;
2046 buf_end = buf + buf_size;
2049 /* reset on every SOI */
2050 s->restart_interval = 0;
2051 s->restart_count = 0;
2052 s->mjpb_skiptosod = 0;
2054 init_get_bits(&hgb, buf_ptr, /*buf_size*/(buf_end - buf_ptr)*8);
2056 skip_bits(&hgb, 32); /* reserved zeros */
2058 if (get_bits_long(&hgb, 32) != be2me_32(ff_get_fourcc("mjpg")))
2060 dprintf("not mjpeg-b (bad fourcc)\n");
2064 field_size = get_bits_long(&hgb, 32); /* field size */
2065 dprintf("field size: 0x%x\n", field_size);
2066 skip_bits(&hgb, 32); /* padded field size */
2067 second_field_offs = get_bits_long(&hgb, 32);
2068 dprintf("second field offs: 0x%x\n", second_field_offs);
2069 if (second_field_offs)
2072 dqt_offs = get_bits_long(&hgb, 32);
2073 dprintf("dqt offs: 0x%x\n", dqt_offs);
2076 init_get_bits(&s->gb, buf+dqt_offs, (buf_end - (buf+dqt_offs))*8);
2077 s->start_code = DQT;
2078 mjpeg_decode_dqt(s);
2081 dht_offs = get_bits_long(&hgb, 32);
2082 dprintf("dht offs: 0x%x\n", dht_offs);
2085 init_get_bits(&s->gb, buf+dht_offs, (buf_end - (buf+dht_offs))*8);
2086 s->start_code = DHT;
2087 mjpeg_decode_dht(s);
2090 sof_offs = get_bits_long(&hgb, 32);
2091 dprintf("sof offs: 0x%x\n", sof_offs);
2094 init_get_bits(&s->gb, buf+sof_offs, (buf_end - (buf+sof_offs))*8);
2095 s->start_code = SOF0;
2096 if (mjpeg_decode_sof(s) < 0)
2100 sos_offs = get_bits_long(&hgb, 32);
2101 dprintf("sos offs: 0x%x\n", sos_offs);
2102 sod_offs = get_bits_long(&hgb, 32);
2103 dprintf("sod offs: 0x%x\n", sod_offs);
2106 // init_get_bits(&s->gb, buf+sos_offs, (buf_end - (buf+sos_offs))*8);
2107 init_get_bits(&s->gb, buf+sos_offs, field_size*8);
/* padding to skip in mjpeg_decode_sos(): the SOS-to-SOD distance minus the
   16-bit value at the start of the SOS section */
2108 s->mjpb_skiptosod = (sod_offs - sos_offs - show_bits(&s->gb, 16));
2109 s->start_code = SOS;
2110 mjpeg_decode_sos(s);
2113 if (s->interlaced) {
2114 s->bottom_field ^= 1;
2115 /* if not bottom field, do not output image yet */
2116 if (s->bottom_field && second_field_offs)
2118 buf_ptr = buf + second_field_offs;
2119 second_field_offs = 0;
2124 //XXX FIXME factorize, this looks very similar to the EOI code
2126 *picture= s->picture;
2127 *data_size = sizeof(AVFrame);
2130 picture->quality= FFMAX(FFMAX(s->qscale[0], s->qscale[1]), s->qscale[2]);
2131 picture->qstride= 0;
2132 picture->qscale_table= s->qscale_table;
2133 memset(picture->qscale_table, picture->quality, (s->width+15)/16);
2134 if(avctx->debug & FF_DEBUG_QP)
2135 av_log(avctx, AV_LOG_DEBUG, "QP: %d\n", picture->quality);
2136 picture->quality*= FF_QP2LAMBDA;
2139 return buf_ptr - buf;
/*
 * Decode one SP5X frame.
 *
 * Path 1 (up to the mjpeg_decode_frame() call): a JPEG stream is assembled
 * in the temporary buffer `recoded` -- SOI, the sp5x_data_dqt template
 * patched with two 64-byte tables taken from sp5x_quant_table for the fixed
 * qscale of 5, the sp5x_data_dht template, the sp5x_data_sof template
 * patched with avctx->coded_height / coded_width, the sp5x_data_sos
 * template, the input payload starting at byte 14, and EOI -- and is handed
 * to mjpeg_decode_frame().
 *
 * Path 2 (everything after that call): the decoder context is filled in by
 * hand and mjpeg_decode_scan() is run directly on buf + 14.
 *
 * NOTE(review): both paths appear back to back; presumably one of them is
 * conditionally compiled out, but the preprocessor lines are not visible in
 * this excerpt -- verify before touching either.
 * NOTE(review): in path 2, mb_width / mb_height are computed as
 * (size * max * 8 - 1) / (max * 8), unlike the (size + max * block - 1) /
 * (max * block) rounding used in mjpeg_decode_sos() -- confirm intent.
 *
 * avctx     - codec context, avctx->priv_data is the MJpegDecodeContext
 * data      - AVFrame passed through to mjpeg_decode_frame()
 * data_size - passed through to mjpeg_decode_frame()
 * buf       - input bytes; the first 14 bytes are not copied
 * buf_size  - number of input bytes
 */
2144 static int sp5x_decode_frame(AVCodecContext *avctx,
2145 void *data, int *data_size,
2146 uint8_t *buf, int buf_size)
2149 MJpegDecodeContext *s = avctx->priv_data;
2151 const int qscale = 5;
2152 uint8_t *buf_ptr, *buf_end, *recoded;
2155 if (!avctx->width || !avctx->height)
2159 buf_end = buf + buf_size;
/* room for the input plus the generated headers */
2162 recoded = av_mallocz(buf_size + 1024);
/* SOI marker */
2167 recoded[j++] = 0xFF;
2168 recoded[j++] = 0xD8;
2170 memcpy(recoded+j, &sp5x_data_dqt[0], sizeof(sp5x_data_dqt));
2171 memcpy(recoded+j+5, &sp5x_quant_table[qscale * 2], 64);
2172 memcpy(recoded+j+70, &sp5x_quant_table[(qscale * 2) + 1], 64);
2173 j += sizeof(sp5x_data_dqt);
2175 memcpy(recoded+j, &sp5x_data_dht[0], sizeof(sp5x_data_dht));
2176 j += sizeof(sp5x_data_dht);
2178 memcpy(recoded+j, &sp5x_data_sof[0], sizeof(sp5x_data_sof));
/* patch the picture height and width (big-endian) into the SOF template */
2179 recoded[j+5] = (avctx->coded_height >> 8) & 0xFF;
2180 recoded[j+6] = avctx->coded_height & 0xFF;
2181 recoded[j+7] = (avctx->coded_width >> 8) & 0xFF;
2182 recoded[j+8] = avctx->coded_width & 0xFF;
2183 j += sizeof(sp5x_data_sof);
2185 memcpy(recoded+j, &sp5x_data_sos[0], sizeof(sp5x_data_sos));
2186 j += sizeof(sp5x_data_sos);
/* copy the payload, leaving two bytes of room for the EOI marker */
2188 for (i = 14; i < buf_size && j < buf_size+1024-2; i++)
2190 recoded[j++] = buf[i];
/* EOI marker */
2196 recoded[j++] = 0xFF;
2197 recoded[j++] = 0xD9;
2199 i = mjpeg_decode_frame(avctx, data, data_size, recoded, j);
2206 s->width = avctx->coded_width;
2207 s->height = avctx->coded_height;
2208 s->nb_components = 3;
2209 s->component_id[0] = 0;
2212 s->quant_index[0] = 0;
2213 s->component_id[1] = 1;
2216 s->quant_index[1] = 1;
2217 s->component_id[2] = 2;
2220 s->quant_index[2] = 1;
2224 s->qscale_table = av_mallocz((s->width+15)/16);
2225 avctx->pix_fmt = s->cs_itu601 ? PIX_FMT_YUV420P : PIX_FMT_YUVJ420;
2228 s->picture.reference = 0;
2229 if (avctx->get_buffer(avctx, &s->picture) < 0)
2231 av_log(avctx, AV_LOG_ERROR, "get_buffer() failed\n");
2235 s->picture.pict_type = I_TYPE;
2236 s->picture.key_frame = 1;
2238 for (i = 0; i < 3; i++)
2239 s->linesize[i] = s->picture.linesize[i] << s->interlaced;
2242 for (i = 0; i < 64; i++)
2244 j = s->scantable.permutated[i];
2245 s->quant_matrixes[0][j] = sp5x_quant_table[(qscale * 2) + i];
2247 s->qscale[0] = FFMAX(
2248 s->quant_matrixes[0][s->scantable.permutated[1]],
2249 s->quant_matrixes[0][s->scantable.permutated[8]]) >> 1;
2251 for (i = 0; i < 64; i++)
2253 j = s->scantable.permutated[i];
2254 s->quant_matrixes[1][j] = sp5x_quant_table[(qscale * 2) + 1 + i];
2256 s->qscale[1] = FFMAX(
2257 s->quant_matrixes[1][s->scantable.permutated[1]],
2258 s->quant_matrixes[1][s->scantable.permutated[8]]) >> 1;
2263 s->comp_index[0] = 0;
2264 s->nb_blocks[0] = s->h_count[0] * s->v_count[0];
2265 s->h_scount[0] = s->h_count[0];
2266 s->v_scount[0] = s->v_count[0];
2270 s->comp_index[1] = 1;
2271 s->nb_blocks[1] = s->h_count[1] * s->v_count[1];
2272 s->h_scount[1] = s->h_count[1];
2273 s->v_scount[1] = s->v_count[1];
2277 s->comp_index[2] = 2;
2278 s->nb_blocks[2] = s->h_count[2] * s->v_count[2];
2279 s->h_scount[2] = s->h_count[2];
2280 s->v_scount[2] = s->v_count[2];
2284 for (i = 0; i < 3; i++)
2285 s->last_dc[i] = 1024;
2287 s->mb_width = (s->width * s->h_max * 8 -1) / (s->h_max * 8);
2288 s->mb_height = (s->height * s->v_max * 8 -1) / (s->v_max * 8);
2290 init_get_bits(&s->gb, buf+14, (buf_size-14)*8);
2292 return mjpeg_decode_scan(s);
/*
 * Decoder teardown: releases s->qscale_table with av_free() and the VLC
 * tables in s->vlcs[][] with free_vlc().
 * NOTE(review): the loop bounds over s->vlcs, any other frees and the return
 * statement are not visible in this excerpt.
 */
2298 static int mjpeg_decode_end(AVCodecContext *avctx)
2300 MJpegDecodeContext *s = avctx->priv_data;
2304 av_free(s->qscale_table);
2308 free_vlc(&s->vlcs[i][j]);
/* Codec descriptor for the MJPEG decoder; its private context has the size
   of MJpegDecodeContext.  The remaining fields are not visible in this
   excerpt. */
2313 AVCodec mjpeg_decoder = {
2317 sizeof(MJpegDecodeContext),
/* Codec descriptor for the MJPEG-B decoder: private context of size
   MJpegDecodeContext, frames decoded by mjpegb_decode_frame().  The
   remaining fields are not visible in this excerpt. */
2326 AVCodec mjpegb_decoder = {
2330 sizeof(MJpegDecodeContext),
2334 mjpegb_decode_frame,
/* Codec descriptor for the SP5X decoder; its private context has the size of
   MJpegDecodeContext.  The remaining fields are not visible in this
   excerpt. */
2339 AVCodec sp5x_decoder = {
2343 sizeof(MJpegDecodeContext),
2352 #ifdef CONFIG_ENCODERS
/* Codec descriptor for the lossless JPEG encoder, only built when
   CONFIG_ENCODERS is defined.  It uses an MpegEncContext as private context
   and encode_picture_lossless() as one of its callbacks.  The remaining
   fields are not visible in this excerpt. */
2353 AVCodec ljpeg_encoder = { //FIXME avoid MPV_* lossless jpeg shouldnt need them
2357 sizeof(MpegEncContext),
2359 encode_picture_lossless,
2364 AVCodecParser mjpeg_parser = {
2366 sizeof(ParseContext),