2 * Copyright (c) 2002-2003 Michael Niedermayer <michaelni@gmx.at>
4 * see http://www.pcisys.net/~melanson/codecs/huffyuv.txt for a description of
7 * This file is part of Libav.
9 * Libav is free software; you can redistribute it and/or
10 * modify it under the terms of the GNU Lesser General Public
11 * License as published by the Free Software Foundation; either
12 * version 2.1 of the License, or (at your option) any later version.
14 * Libav is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
17 * Lesser General Public License for more details.
19 * You should have received a copy of the GNU Lesser General Public
20 * License along with Libav; if not, write to the Free Software
21 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
32 #include "huffyuvencdsp.h"
36 static inline int sub_left_prediction(HYuvContext *s, uint8_t *dst,
37 uint8_t *src, int w, int left)
41 for (i = 0; i < w; i++) {
42 const int temp = src[i];
48 for (i = 0; i < 16; i++) {
49 const int temp = src[i];
53 s->hencdsp.diff_bytes(dst + 16, src + 16, src + 15, w - 16);
58 static inline void sub_left_prediction_bgr32(HYuvContext *s, uint8_t *dst,
60 int *red, int *green, int *blue,
70 for (i = 0; i < FFMIN(w, 4); i++) {
71 const int rt = src[i * 4 + R];
72 const int gt = src[i * 4 + G];
73 const int bt = src[i * 4 + B];
74 const int at = src[i * 4 + A];
75 dst[i * 4 + R] = rt - r;
76 dst[i * 4 + G] = gt - g;
77 dst[i * 4 + B] = bt - b;
78 dst[i * 4 + A] = at - a;
85 s->hencdsp.diff_bytes(dst + 16, src + 16, src + 12, w * 4 - 16);
87 *red = src[(w - 1) * 4 + R];
88 *green = src[(w - 1) * 4 + G];
89 *blue = src[(w - 1) * 4 + B];
90 *alpha = src[(w - 1) * 4 + A];
93 static inline void sub_left_prediction_rgb24(HYuvContext *s, uint8_t *dst,
95 int *red, int *green, int *blue)
102 for (i = 0; i < FFMIN(w, 16); i++) {
103 const int rt = src[i * 3 + 0];
104 const int gt = src[i * 3 + 1];
105 const int bt = src[i * 3 + 2];
106 dst[i * 3 + 0] = rt - r;
107 dst[i * 3 + 1] = gt - g;
108 dst[i * 3 + 2] = bt - b;
114 s->hencdsp.diff_bytes(dst + 48, src + 48, src + 48 - 3, w * 3 - 48);
116 *red = src[(w - 1) * 3 + 0];
117 *green = src[(w - 1) * 3 + 1];
118 *blue = src[(w - 1) * 3 + 2];
121 static int store_table(HYuvContext *s, const uint8_t *len, uint8_t *buf)
126 for (i = 0; i < 256;) {
130 for (; i < 256 && len[i] == val && repeat < 255; i++)
133 assert(val < 32 && val >0 && repeat<256 && repeat>0);
136 buf[index++] = repeat;
138 buf[index++] = val | (repeat << 5);
145 static av_cold int encode_init(AVCodecContext *avctx)
147 HYuvContext *s = avctx->priv_data;
150 ff_huffyuv_common_init(avctx);
151 ff_huffyuvencdsp_init(&s->hencdsp);
153 avctx->extradata = av_mallocz(1024*30); // 256*3+4 == 772
154 avctx->stats_out = av_mallocz(1024*30); // 21*256*3(%llu ) + 3(\n) + 1(0) = 16132
157 if (!avctx->extradata || !avctx->stats_out)
158 return AVERROR(ENOMEM);
160 #if FF_API_CODED_FRAME
161 FF_DISABLE_DEPRECATION_WARNINGS
162 avctx->coded_frame->pict_type = AV_PICTURE_TYPE_I;
163 avctx->coded_frame->key_frame = 1;
164 FF_ENABLE_DEPRECATION_WARNINGS
167 switch (avctx->pix_fmt) {
168 case AV_PIX_FMT_YUV420P:
169 case AV_PIX_FMT_YUV422P:
171 av_log(avctx, AV_LOG_ERROR, "Width must be even for this colorspace.\n");
174 s->bitstream_bpp = avctx->pix_fmt == AV_PIX_FMT_YUV420P ? 12 : 16;
176 case AV_PIX_FMT_RGB32:
177 s->bitstream_bpp = 32;
179 case AV_PIX_FMT_RGB24:
180 s->bitstream_bpp = 24;
183 av_log(avctx, AV_LOG_ERROR, "format not supported\n");
186 avctx->bits_per_coded_sample = s->bitstream_bpp;
187 s->decorrelate = s->bitstream_bpp >= 24;
188 s->predictor = avctx->prediction_method;
189 s->interlaced = avctx->flags & AV_CODEC_FLAG_INTERLACED_ME ? 1 : 0;
190 if (avctx->context_model == 1) {
191 s->context = avctx->context_model;
192 if (s->flags & (AV_CODEC_FLAG_PASS1 | AV_CODEC_FLAG_PASS2)) {
193 av_log(avctx, AV_LOG_ERROR,
194 "context=1 is not compatible with "
195 "2 pass huffyuv encoding\n");
200 if (avctx->codec->id == AV_CODEC_ID_HUFFYUV) {
201 if (avctx->pix_fmt == AV_PIX_FMT_YUV420P) {
202 av_log(avctx, AV_LOG_ERROR,
203 "Error: YV12 is not supported by huffyuv; use "
204 "vcodec=ffvhuff or format=422p\n");
207 if (avctx->context_model) {
208 av_log(avctx, AV_LOG_ERROR,
209 "Error: per-frame huffman tables are not supported "
210 "by huffyuv; use vcodec=ffvhuff\n");
213 if (s->interlaced != ( s->height > 288 ))
214 av_log(avctx, AV_LOG_INFO,
215 "using huffyuv 2.2.0 or newer interlacing flag\n");
218 if (s->bitstream_bpp >= 24 && s->predictor == MEDIAN) {
219 av_log(avctx, AV_LOG_ERROR,
220 "Error: RGB is incompatible with median predictor\n");
224 ((uint8_t*)avctx->extradata)[0] = s->predictor | (s->decorrelate << 6);
225 ((uint8_t*)avctx->extradata)[1] = s->bitstream_bpp;
226 ((uint8_t*)avctx->extradata)[2] = s->interlaced ? 0x10 : 0x20;
228 ((uint8_t*)avctx->extradata)[2] |= 0x40;
229 ((uint8_t*)avctx->extradata)[3] = 0;
230 s->avctx->extradata_size = 4;
232 if (avctx->stats_in) {
233 char *p = avctx->stats_in;
235 for (i = 0; i < 3; i++)
236 for (j = 0; j < 256; j++)
240 for (i = 0; i < 3; i++) {
243 for (j = 0; j < 256; j++) {
244 s->stats[i][j] += strtol(p, &next, 0);
245 if (next == p) return -1;
249 if (p[0] == 0 || p[1] == 0 || p[2] == 0) break;
252 for (i = 0; i < 3; i++)
253 for (j = 0; j < 256; j++) {
254 int d = FFMIN(j, 256 - j);
256 s->stats[i][j] = 100000000 / (d + 1);
260 for (i = 0; i < 3; i++) {
261 ff_huff_gen_len_table(s->len[i], s->stats[i]);
263 if (ff_huffyuv_generate_bits_table(s->bits[i], s->len[i]) < 0) {
267 s->avctx->extradata_size +=
268 store_table(s, s->len[i], &((uint8_t*)s->avctx->extradata)[s->avctx->extradata_size]);
272 for (i = 0; i < 3; i++) {
273 int pels = s->width * s->height / (i ? 40 : 10);
274 for (j = 0; j < 256; j++) {
275 int d = FFMIN(j, 256 - j);
276 s->stats[i][j] = pels/(d + 1);
280 for (i = 0; i < 3; i++)
281 for (j = 0; j < 256; j++)
285 ff_huffyuv_alloc_temp(s);
291 static int encode_422_bitstream(HYuvContext *s, int offset, int count)
294 const uint8_t *y = s->temp[0] + offset;
295 const uint8_t *u = s->temp[1] + offset / 2;
296 const uint8_t *v = s->temp[2] + offset / 2;
298 if (s->pb.buf_end - s->pb.buf - (put_bits_count(&s->pb) >> 3) < 2 * 4 * count) {
299 av_log(s->avctx, AV_LOG_ERROR, "encoded frame too large\n");
305 int y1 = y[2 * i + 1];\
311 if (s->flags & AV_CODEC_FLAG_PASS1) {
312 for(i = 0; i < count; i++) {
320 if (s->avctx->flags2 & AV_CODEC_FLAG2_NO_OUTPUT)
323 for (i = 0; i < count; i++) {
326 put_bits(&s->pb, s->len[0][y0], s->bits[0][y0]);
328 put_bits(&s->pb, s->len[1][u0], s->bits[1][u0]);
330 put_bits(&s->pb, s->len[0][y1], s->bits[0][y1]);
332 put_bits(&s->pb, s->len[2][v0], s->bits[2][v0]);
335 for(i = 0; i < count; i++) {
337 put_bits(&s->pb, s->len[0][y0], s->bits[0][y0]);
338 put_bits(&s->pb, s->len[1][u0], s->bits[1][u0]);
339 put_bits(&s->pb, s->len[0][y1], s->bits[0][y1]);
340 put_bits(&s->pb, s->len[2][v0], s->bits[2][v0]);
346 static int encode_gray_bitstream(HYuvContext *s, int count)
350 if (s->pb.buf_end - s->pb.buf - (put_bits_count(&s->pb) >> 3) < 4 * count) {
351 av_log(s->avctx, AV_LOG_ERROR, "encoded frame too large\n");
356 int y0 = s->temp[0][2 * i];\
357 int y1 = s->temp[0][2 * i + 1];
362 put_bits(&s->pb, s->len[0][y0], s->bits[0][y0]);\
363 put_bits(&s->pb, s->len[0][y1], s->bits[0][y1]);
367 if (s->flags & AV_CODEC_FLAG_PASS1) {
368 for (i = 0; i < count; i++) {
373 if (s->avctx->flags2 & AV_CODEC_FLAG2_NO_OUTPUT)
377 for (i = 0; i < count; i++) {
383 for (i = 0; i < count; i++) {
391 static inline int encode_bgra_bitstream(HYuvContext *s, int count, int planes)
395 if (s->pb.buf_end - s->pb.buf - (put_bits_count(&s->pb) >> 3) <
396 4 * planes * count) {
397 av_log(s->avctx, AV_LOG_ERROR, "encoded frame too large\n");
402 int g = s->temp[0][planes == 3 ? 3 * i + 1 : 4 * i + G]; \
403 int b = s->temp[0][planes == 3 ? 3 * i + 2 : 4 * i + B] - g & 0xFF; \
404 int r = s->temp[0][planes == 3 ? 3 * i + 0 : 4 * i + R] - g & 0xFF; \
405 int a = s->temp[0][planes * i + A];
415 put_bits(&s->pb, s->len[1][g], s->bits[1][g]); \
416 put_bits(&s->pb, s->len[0][b], s->bits[0][b]); \
417 put_bits(&s->pb, s->len[2][r], s->bits[2][r]); \
419 put_bits(&s->pb, s->len[2][a], s->bits[2][a]);
421 if ((s->flags & AV_CODEC_FLAG_PASS1) &&
422 (s->avctx->flags2 & AV_CODEC_FLAG2_NO_OUTPUT)) {
423 for (i = 0; i < count; i++) {
427 } else if (s->context || (s->flags & AV_CODEC_FLAG_PASS1)) {
428 for (i = 0; i < count; i++) {
434 for (i = 0; i < count; i++) {
442 static int encode_frame(AVCodecContext *avctx, AVPacket *pkt,
443 const AVFrame *pict, int *got_packet)
445 HYuvContext *s = avctx->priv_data;
446 const int width = s->width;
447 const int width2 = s->width>>1;
448 const int height = s->height;
449 const int fake_ystride = s->interlaced ? pict->linesize[0]*2 : pict->linesize[0];
450 const int fake_ustride = s->interlaced ? pict->linesize[1]*2 : pict->linesize[1];
451 const int fake_vstride = s->interlaced ? pict->linesize[2]*2 : pict->linesize[2];
452 const AVFrame * const p = pict;
453 int i, j, size = 0, ret;
456 (ret = av_new_packet(pkt, width * height * 3 * 4 + FF_MIN_BUFFER_SIZE)) < 0) {
457 av_log(avctx, AV_LOG_ERROR, "Error allocating output packet.\n");
462 for (i = 0; i < 3; i++) {
463 ff_huff_gen_len_table(s->len[i], s->stats[i]);
464 if (ff_huffyuv_generate_bits_table(s->bits[i], s->len[i]) < 0)
466 size += store_table(s, s->len[i], &pkt->data[size]);
469 for (i = 0; i < 3; i++)
470 for (j = 0; j < 256; j++)
471 s->stats[i][j] >>= 1;
474 init_put_bits(&s->pb, pkt->data + size, pkt->size - size);
476 if (avctx->pix_fmt == AV_PIX_FMT_YUV422P ||
477 avctx->pix_fmt == AV_PIX_FMT_YUV420P) {
478 int lefty, leftu, leftv, y, cy;
480 put_bits(&s->pb, 8, leftv = p->data[2][0]);
481 put_bits(&s->pb, 8, lefty = p->data[0][1]);
482 put_bits(&s->pb, 8, leftu = p->data[1][0]);
483 put_bits(&s->pb, 8, p->data[0][0]);
485 lefty = sub_left_prediction(s, s->temp[0], p->data[0], width , 0);
486 leftu = sub_left_prediction(s, s->temp[1], p->data[1], width2, 0);
487 leftv = sub_left_prediction(s, s->temp[2], p->data[2], width2, 0);
489 encode_422_bitstream(s, 2, width-2);
491 if (s->predictor==MEDIAN) {
492 int lefttopy, lefttopu, lefttopv;
495 lefty = sub_left_prediction(s, s->temp[0], p->data[0] + p->linesize[0], width , lefty);
496 leftu = sub_left_prediction(s, s->temp[1], p->data[1] + p->linesize[1], width2, leftu);
497 leftv = sub_left_prediction(s, s->temp[2], p->data[2] + p->linesize[2], width2, leftv);
499 encode_422_bitstream(s, 0, width);
503 lefty = sub_left_prediction(s, s->temp[0], p->data[0] + fake_ystride, 4, lefty);
504 leftu = sub_left_prediction(s, s->temp[1], p->data[1] + fake_ustride, 2, leftu);
505 leftv = sub_left_prediction(s, s->temp[2], p->data[2] + fake_vstride, 2, leftv);
507 encode_422_bitstream(s, 0, 4);
509 lefttopy = p->data[0][3];
510 lefttopu = p->data[1][1];
511 lefttopv = p->data[2][1];
512 s->hencdsp.sub_hfyu_median_pred(s->temp[0], p->data[0] + 4, p->data[0] + fake_ystride + 4, width - 4, &lefty, &lefttopy);
513 s->hencdsp.sub_hfyu_median_pred(s->temp[1], p->data[1] + 2, p->data[1] + fake_ustride + 2, width2 - 2, &leftu, &lefttopu);
514 s->hencdsp.sub_hfyu_median_pred(s->temp[2], p->data[2] + 2, p->data[2] + fake_vstride + 2, width2 - 2, &leftv, &lefttopv);
515 encode_422_bitstream(s, 0, width - 4);
518 for (; y < height; y++,cy++) {
519 uint8_t *ydst, *udst, *vdst;
521 if (s->bitstream_bpp == 12) {
523 ydst = p->data[0] + p->linesize[0] * y;
524 s->hencdsp.sub_hfyu_median_pred(s->temp[0], ydst - fake_ystride, ydst, width, &lefty, &lefttopy);
525 encode_gray_bitstream(s, width);
528 if (y >= height) break;
530 ydst = p->data[0] + p->linesize[0] * y;
531 udst = p->data[1] + p->linesize[1] * cy;
532 vdst = p->data[2] + p->linesize[2] * cy;
534 s->hencdsp.sub_hfyu_median_pred(s->temp[0], ydst - fake_ystride, ydst, width, &lefty, &lefttopy);
535 s->hencdsp.sub_hfyu_median_pred(s->temp[1], udst - fake_ustride, udst, width2, &leftu, &lefttopu);
536 s->hencdsp.sub_hfyu_median_pred(s->temp[2], vdst - fake_vstride, vdst, width2, &leftv, &lefttopv);
538 encode_422_bitstream(s, 0, width);
541 for (cy = y = 1; y < height; y++, cy++) {
542 uint8_t *ydst, *udst, *vdst;
544 /* encode a luma only line & y++ */
545 if (s->bitstream_bpp == 12) {
546 ydst = p->data[0] + p->linesize[0] * y;
548 if (s->predictor == PLANE && s->interlaced < y) {
549 s->hencdsp.diff_bytes(s->temp[1], ydst, ydst - fake_ystride, width);
551 lefty = sub_left_prediction(s, s->temp[0], s->temp[1], width , lefty);
553 lefty = sub_left_prediction(s, s->temp[0], ydst, width , lefty);
555 encode_gray_bitstream(s, width);
557 if (y >= height) break;
560 ydst = p->data[0] + p->linesize[0] * y;
561 udst = p->data[1] + p->linesize[1] * cy;
562 vdst = p->data[2] + p->linesize[2] * cy;
564 if (s->predictor == PLANE && s->interlaced < cy) {
565 s->hencdsp.diff_bytes(s->temp[1], ydst, ydst - fake_ystride, width);
566 s->hencdsp.diff_bytes(s->temp[2], udst, udst - fake_ustride, width2);
567 s->hencdsp.diff_bytes(s->temp[2] + width2, vdst, vdst - fake_vstride, width2);
569 lefty = sub_left_prediction(s, s->temp[0], s->temp[1], width , lefty);
570 leftu = sub_left_prediction(s, s->temp[1], s->temp[2], width2, leftu);
571 leftv = sub_left_prediction(s, s->temp[2], s->temp[2] + width2, width2, leftv);
573 lefty = sub_left_prediction(s, s->temp[0], ydst, width , lefty);
574 leftu = sub_left_prediction(s, s->temp[1], udst, width2, leftu);
575 leftv = sub_left_prediction(s, s->temp[2], vdst, width2, leftv);
578 encode_422_bitstream(s, 0, width);
581 } else if(avctx->pix_fmt == AV_PIX_FMT_RGB32) {
582 uint8_t *data = p->data[0] + (height - 1) * p->linesize[0];
583 const int stride = -p->linesize[0];
584 const int fake_stride = -fake_ystride;
586 int leftr, leftg, leftb, lefta;
588 put_bits(&s->pb, 8, lefta = data[A]);
589 put_bits(&s->pb, 8, leftr = data[R]);
590 put_bits(&s->pb, 8, leftg = data[G]);
591 put_bits(&s->pb, 8, leftb = data[B]);
593 sub_left_prediction_bgr32(s, s->temp[0], data + 4, width - 1,
594 &leftr, &leftg, &leftb, &lefta);
595 encode_bgra_bitstream(s, width - 1, 4);
597 for (y = 1; y < s->height; y++) {
598 uint8_t *dst = data + y*stride;
599 if (s->predictor == PLANE && s->interlaced < y) {
600 s->hencdsp.diff_bytes(s->temp[1], dst, dst - fake_stride, width * 4);
601 sub_left_prediction_bgr32(s, s->temp[0], s->temp[1], width,
602 &leftr, &leftg, &leftb, &lefta);
604 sub_left_prediction_bgr32(s, s->temp[0], dst, width,
605 &leftr, &leftg, &leftb, &lefta);
607 encode_bgra_bitstream(s, width, 4);
609 } else if (avctx->pix_fmt == AV_PIX_FMT_RGB24) {
610 uint8_t *data = p->data[0] + (height - 1) * p->linesize[0];
611 const int stride = -p->linesize[0];
612 const int fake_stride = -fake_ystride;
614 int leftr, leftg, leftb;
616 put_bits(&s->pb, 8, leftr = data[0]);
617 put_bits(&s->pb, 8, leftg = data[1]);
618 put_bits(&s->pb, 8, leftb = data[2]);
619 put_bits(&s->pb, 8, 0);
621 sub_left_prediction_rgb24(s, s->temp[0], data + 3, width - 1,
622 &leftr, &leftg, &leftb);
623 encode_bgra_bitstream(s, width-1, 3);
625 for (y = 1; y < s->height; y++) {
626 uint8_t *dst = data + y * stride;
627 if (s->predictor == PLANE && s->interlaced < y) {
628 s->hencdsp.diff_bytes(s->temp[1], dst, dst - fake_stride,
630 sub_left_prediction_rgb24(s, s->temp[0], s->temp[1], width,
631 &leftr, &leftg, &leftb);
633 sub_left_prediction_rgb24(s, s->temp[0], dst, width,
634 &leftr, &leftg, &leftb);
636 encode_bgra_bitstream(s, width, 3);
639 av_log(avctx, AV_LOG_ERROR, "Format not supported!\n");
643 size += (put_bits_count(&s->pb) + 31) / 8;
644 put_bits(&s->pb, 16, 0);
645 put_bits(&s->pb, 15, 0);
648 if ((s->flags & AV_CODEC_FLAG_PASS1) && (s->picture_number & 31) == 0) {
650 char *p = avctx->stats_out;
651 char *end = p + 1024*30;
652 for (i = 0; i < 3; i++) {
653 for (j = 0; j < 256; j++) {
654 snprintf(p, end-p, "%"PRIu64" ", s->stats[i][j]);
658 snprintf(p, end-p, "\n");
662 avctx->stats_out[0] = '\0';
663 if (!(s->avctx->flags2 & AV_CODEC_FLAG2_NO_OUTPUT)) {
664 flush_put_bits(&s->pb);
665 s->bdsp.bswap_buf((uint32_t *) pkt->data, (uint32_t *) pkt->data, size);
670 pkt->size = size * 4;
671 pkt->flags |= AV_PKT_FLAG_KEY;
677 static av_cold int encode_end(AVCodecContext *avctx)
679 HYuvContext *s = avctx->priv_data;
681 ff_huffyuv_common_end(s);
683 av_freep(&avctx->extradata);
684 av_freep(&avctx->stats_out);
689 AVCodec ff_huffyuv_encoder = {
691 .long_name = NULL_IF_CONFIG_SMALL("Huffyuv / HuffYUV"),
692 .type = AVMEDIA_TYPE_VIDEO,
693 .id = AV_CODEC_ID_HUFFYUV,
694 .priv_data_size = sizeof(HYuvContext),
696 .encode2 = encode_frame,
698 .pix_fmts = (const enum AVPixelFormat[]){
699 AV_PIX_FMT_YUV422P, AV_PIX_FMT_RGB24,
700 AV_PIX_FMT_RGB32, AV_PIX_FMT_NONE
702 .caps_internal = FF_CODEC_CAP_INIT_THREADSAFE |
703 FF_CODEC_CAP_INIT_CLEANUP,
706 #if CONFIG_FFVHUFF_ENCODER
707 AVCodec ff_ffvhuff_encoder = {
709 .long_name = NULL_IF_CONFIG_SMALL("Huffyuv FFmpeg variant"),
710 .type = AVMEDIA_TYPE_VIDEO,
711 .id = AV_CODEC_ID_FFVHUFF,
712 .priv_data_size = sizeof(HYuvContext),
714 .encode2 = encode_frame,
716 .pix_fmts = (const enum AVPixelFormat[]){
717 AV_PIX_FMT_YUV420P, AV_PIX_FMT_YUV422P, AV_PIX_FMT_RGB24,
718 AV_PIX_FMT_RGB32, AV_PIX_FMT_NONE
720 .caps_internal = FF_CODEC_CAP_INIT_THREADSAFE |
721 FF_CODEC_CAP_INIT_CLEANUP,