2 * Microsoft Screen 3 (aka Microsoft ATC Screen) decoder
3 * Copyright (c) 2012 Konstantin Shishkov
5 * This file is part of FFmpeg.
7 * FFmpeg is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2.1 of the License, or (at your option) any later version.
12 * FFmpeg is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Lesser General Public License for more details.
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with FFmpeg; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
24 * Microsoft Screen 3 (aka Microsoft ATC Screen) decoder
28 #include "bytestream.h"
33 #define HEADER_SIZE 27
35 #define MODEL2_SCALE 13
36 #define MODEL_SCALE 15
37 #define MODEL256_SEC_SCALE 9
39 typedef struct Model2 {
40 int upd_val, till_rescale;
41 unsigned zero_freq, zero_weight;
42 unsigned total_freq, total_weight;
45 typedef struct Model {
46 int weights[16], freqs[16];
49 int upd_val, max_upd_val, till_rescale;
52 typedef struct Model256 {
53 int weights[256], freqs[256];
57 int upd_val, max_upd_val, till_rescale;
60 #define RAC_BOTTOM 0x01000000
61 typedef struct RangeCoder {
62 const uint8_t *src, *src_end;
76 typedef struct BlockTypeContext {
81 typedef struct FillBlockCoder {
86 typedef struct ImageBlockCoder {
87 Model256 esc_model, vec_entry_model;
92 typedef struct DCTBlockCoder {
94 ptrdiff_t prev_dc_stride;
103 typedef struct HaarBlockCoder {
109 typedef struct MSS3Context {
110 AVCodecContext *avctx;
115 BlockTypeContext btype[3];
116 FillBlockCoder fill_coder[3];
117 ImageBlockCoder image_coder[3];
118 DCTBlockCoder dct_coder[3];
119 HaarBlockCoder haar_coder[3];
126 static void model2_reset(Model2 *m)
130 m->zero_freq = 0x1000;
131 m->total_freq = 0x2000;
136 static void model2_update(Model2 *m, int bit)
146 m->total_weight += m->upd_val;
147 if (m->total_weight > 0x2000) {
148 m->total_weight = (m->total_weight + 1) >> 1;
149 m->zero_weight = (m->zero_weight + 1) >> 1;
150 if (m->total_weight == m->zero_weight)
151 m->total_weight = m->zero_weight + 1;
153 m->upd_val = m->upd_val * 5 >> 2;
156 scale = 0x80000000u / m->total_weight;
157 m->zero_freq = m->zero_weight * scale >> 18;
158 m->total_freq = m->total_weight * scale >> 18;
159 m->till_rescale = m->upd_val;
162 static void model_update(Model *m, int val)
171 m->tot_weight += m->upd_val;
173 if (m->tot_weight > 0x8000) {
175 for (i = 0; i < m->num_syms; i++) {
176 m->weights[i] = (m->weights[i] + 1) >> 1;
177 m->tot_weight += m->weights[i];
180 scale = 0x80000000u / m->tot_weight;
181 for (i = 0; i < m->num_syms; i++) {
182 m->freqs[i] = sum * scale >> 16;
183 sum += m->weights[i];
186 m->upd_val = m->upd_val * 5 >> 2;
187 if (m->upd_val > m->max_upd_val)
188 m->upd_val = m->max_upd_val;
189 m->till_rescale = m->upd_val;
192 static void model_reset(Model *m)
197 for (i = 0; i < m->num_syms - 1; i++)
199 m->weights[m->num_syms - 1] = 0;
201 m->upd_val = m->num_syms;
203 model_update(m, m->num_syms - 1);
205 m->upd_val = (m->num_syms + 6) >> 1;
208 static av_cold void model_init(Model *m, int num_syms)
210 m->num_syms = num_syms;
211 m->max_upd_val = 8 * num_syms + 48;
216 static void model256_update(Model256 *m, int val)
226 m->tot_weight += m->upd_val;
228 if (m->tot_weight > 0x8000) {
230 for (i = 0; i < 256; i++) {
231 m->weights[i] = (m->weights[i] + 1) >> 1;
232 m->tot_weight += m->weights[i];
235 scale = 0x80000000u / m->tot_weight;
237 for (i = 0; i < 256; i++) {
238 m->freqs[i] = sum * scale >> 16;
239 sum += m->weights[i];
240 send = m->freqs[i] >> MODEL256_SEC_SCALE;
242 m->secondary[sidx++] = i - 1;
244 while (sidx < m->sec_size)
245 m->secondary[sidx++] = 255;
247 m->upd_val = m->upd_val * 5 >> 2;
248 if (m->upd_val > m->max_upd_val)
249 m->upd_val = m->max_upd_val;
250 m->till_rescale = m->upd_val;
253 static void model256_reset(Model256 *m)
257 for (i = 0; i < 255; i++)
264 model256_update(m, 255);
266 m->upd_val = (256 + 6) >> 1;
269 static av_cold void model256_init(Model256 *m)
271 m->max_upd_val = 8 * 256 + 48;
272 m->sec_size = (1 << 6) + 2;
277 static void rac_init(RangeCoder *c, const uint8_t *src, int size)
282 c->src_end = src + size;
284 for (i = 0; i < FFMIN(size, 4); i++)
285 c->low = (c->low << 8) | *c->src++;
286 c->range = 0xFFFFFFFF;
290 static void rac_normalise(RangeCoder *c)
295 if (c->src < c->src_end) {
297 } else if (!c->low) {
301 if (c->low > c->range) {
305 if (c->range >= RAC_BOTTOM)
310 static int rac_get_bit(RangeCoder *c)
316 bit = (c->range <= c->low);
320 if (c->range < RAC_BOTTOM)
326 static int rac_get_bits(RangeCoder *c, int nbits)
331 val = c->low / c->range;
332 c->low -= c->range * val;
334 if (c->range < RAC_BOTTOM)
340 static int rac_get_model2_sym(RangeCoder *c, Model2 *m)
344 helper = m->zero_freq * (c->range >> MODEL2_SCALE);
345 bit = (c->low >= helper);
353 if (c->range < RAC_BOTTOM)
356 model2_update(m, bit);
361 static int rac_get_model_sym(RangeCoder *c, Model *m)
365 unsigned prob, prob2, helper;
369 c->range >>= MODEL_SCALE;
371 end = m->num_syms >> 1;
374 helper = m->freqs[end] * c->range;
375 if (helper <= c->low) {
382 end = (end2 + val) >> 1;
383 } while (end != val);
385 c->range = prob2 - prob;
386 if (c->range < RAC_BOTTOM)
389 model_update(m, val);
394 static int rac_get_model256_sym(RangeCoder *c, Model256 *m)
399 unsigned prob, prob2, helper;
402 c->range >>= MODEL_SCALE;
404 helper = c->low / c->range;
405 ssym = helper >> MODEL256_SEC_SCALE;
406 val = m->secondary[ssym];
408 end = start = m->secondary[ssym + 1] + 1;
409 while (end > val + 1) {
410 ssym = (end + val) >> 1;
411 if (m->freqs[ssym] <= helper) {
415 end = (end + val) >> 1;
419 prob = m->freqs[val] * c->range;
421 prob2 = m->freqs[val + 1] * c->range;
424 c->range = prob2 - prob;
425 if (c->range < RAC_BOTTOM)
428 model256_update(m, val);
433 static int decode_block_type(RangeCoder *c, BlockTypeContext *bt)
435 bt->last_type = rac_get_model_sym(c, &bt->bt_model[bt->last_type]);
437 return bt->last_type;
440 static int decode_coeff(RangeCoder *c, Model *m)
444 val = rac_get_model_sym(c, m);
446 sign = rac_get_bit(c);
449 val = (1 << val) + rac_get_bits(c, val);
458 static void decode_fill_block(RangeCoder *c, FillBlockCoder *fc,
459 uint8_t *dst, ptrdiff_t stride, int block_size)
463 fc->fill_val += decode_coeff(c, &fc->coef_model);
465 for (i = 0; i < block_size; i++, dst += stride)
466 memset(dst, fc->fill_val, block_size);
469 static void decode_image_block(RangeCoder *c, ImageBlockCoder *ic,
470 uint8_t *dst, ptrdiff_t stride, int block_size)
478 vec_size = rac_get_model_sym(c, &ic->vec_size_model) + 2;
479 for (i = 0; i < vec_size; i++)
480 vec[i] = rac_get_model256_sym(c, &ic->vec_entry_model);
483 memset(prev_line, 0, sizeof(prev_line));
485 for (j = 0; j < block_size; j++) {
488 for (i = 0; i < block_size; i++) {
491 A = rac_get_model_sym(c, &ic->vq_model[A + B * 5 + C * 25]);
497 dst[i] = rac_get_model256_sym(c, &ic->esc_model);
503 static int decode_dct(RangeCoder *c, DCTBlockCoder *bc, int *block,
506 int skip, val, sign, pos = 1, zz_pos, dc;
507 int blk_pos = bx + by * bc->prev_dc_stride;
509 memset(block, 0, sizeof(*block) * 64);
511 dc = decode_coeff(c, &bc->dc_model);
516 l = bc->prev_dc[blk_pos - 1];
517 tl = bc->prev_dc[blk_pos - 1 - bc->prev_dc_stride];
518 t = bc->prev_dc[blk_pos - bc->prev_dc_stride];
520 if (FFABS(t - tl) <= FFABS(l - tl))
525 dc += bc->prev_dc[blk_pos - bc->prev_dc_stride];
528 dc += bc->prev_dc[bx - 1];
530 bc->prev_dc[blk_pos] = dc;
531 block[0] = dc * bc->qmat[0];
534 val = rac_get_model256_sym(c, &bc->ac_model);
549 sign = rac_get_model2_sym(c, &bc->sign_model);
552 val = (1 << val) + rac_get_bits(c, val);
557 zz_pos = ff_zigzag_direct[pos];
558 block[zz_pos] = val * bc->qmat[zz_pos];
562 return pos == 64 ? 0 : -1;
565 static void decode_dct_block(RangeCoder *c, DCTBlockCoder *bc,
566 uint8_t *dst, ptrdiff_t stride, int block_size,
567 int *block, int mb_x, int mb_y)
571 int nblocks = block_size >> 3;
576 for (j = 0; j < nblocks; j++) {
577 for (i = 0; i < nblocks; i++) {
578 if (decode_dct(c, bc, block, bx + i, by + j)) {
582 ff_mss34_dct_put(dst + i * 8, stride, block);
588 static void decode_haar_block(RangeCoder *c, HaarBlockCoder *hc,
589 uint8_t *dst, ptrdiff_t stride,
590 int block_size, int *block)
592 const int hsize = block_size >> 1;
593 int A, B, C, D, t1, t2, t3, t4;
596 for (j = 0; j < block_size; j++) {
597 for (i = 0; i < block_size; i++) {
598 if (i < hsize && j < hsize)
599 block[i] = rac_get_model256_sym(c, &hc->coef_model);
601 block[i] = decode_coeff(c, &hc->coef_hi_model);
602 block[i] *= hc->scale;
606 block -= block_size * block_size;
608 for (j = 0; j < hsize; j++) {
609 for (i = 0; i < hsize; i++) {
611 B = block[i + hsize];
612 C = block[i + hsize * block_size];
613 D = block[i + hsize * block_size + hsize];
619 dst[i * 2] = av_clip_uint8(t1 - t2);
620 dst[i * 2 + stride] = av_clip_uint8(t1 + t2);
621 dst[i * 2 + 1] = av_clip_uint8(t3 - t4);
622 dst[i * 2 + 1 + stride] = av_clip_uint8(t3 + t4);
629 static void reset_coders(MSS3Context *ctx, int quality)
633 for (i = 0; i < 3; i++) {
634 ctx->btype[i].last_type = SKIP_BLOCK;
635 for (j = 0; j < 5; j++)
636 model_reset(&ctx->btype[i].bt_model[j]);
637 ctx->fill_coder[i].fill_val = 0;
638 model_reset(&ctx->fill_coder[i].coef_model);
639 model256_reset(&ctx->image_coder[i].esc_model);
640 model256_reset(&ctx->image_coder[i].vec_entry_model);
641 model_reset(&ctx->image_coder[i].vec_size_model);
642 for (j = 0; j < 125; j++)
643 model_reset(&ctx->image_coder[i].vq_model[j]);
644 if (ctx->dct_coder[i].quality != quality) {
645 ctx->dct_coder[i].quality = quality;
646 ff_mss34_gen_quant_mat(ctx->dct_coder[i].qmat, quality, !i);
648 memset(ctx->dct_coder[i].prev_dc, 0,
649 sizeof(*ctx->dct_coder[i].prev_dc) *
650 ctx->dct_coder[i].prev_dc_stride *
651 ctx->dct_coder[i].prev_dc_height);
652 model_reset(&ctx->dct_coder[i].dc_model);
653 model2_reset(&ctx->dct_coder[i].sign_model);
654 model256_reset(&ctx->dct_coder[i].ac_model);
655 if (ctx->haar_coder[i].quality != quality) {
656 ctx->haar_coder[i].quality = quality;
657 ctx->haar_coder[i].scale = 17 - 7 * quality / 50;
659 model_reset(&ctx->haar_coder[i].coef_hi_model);
660 model256_reset(&ctx->haar_coder[i].coef_model);
664 static av_cold void init_coders(MSS3Context *ctx)
668 for (i = 0; i < 3; i++) {
669 for (j = 0; j < 5; j++)
670 model_init(&ctx->btype[i].bt_model[j], 5);
671 model_init(&ctx->fill_coder[i].coef_model, 12);
672 model256_init(&ctx->image_coder[i].esc_model);
673 model256_init(&ctx->image_coder[i].vec_entry_model);
674 model_init(&ctx->image_coder[i].vec_size_model, 3);
675 for (j = 0; j < 125; j++)
676 model_init(&ctx->image_coder[i].vq_model[j], 5);
677 model_init(&ctx->dct_coder[i].dc_model, 12);
678 model256_init(&ctx->dct_coder[i].ac_model);
679 model_init(&ctx->haar_coder[i].coef_hi_model, 12);
680 model256_init(&ctx->haar_coder[i].coef_model);
684 static int mss3_decode_frame(AVCodecContext *avctx, void *data, int *got_frame,
687 const uint8_t *buf = avpkt->data;
688 int buf_size = avpkt->size;
689 MSS3Context *c = avctx->priv_data;
690 RangeCoder *acoder = &c->coder;
693 int dec_width, dec_height, dec_x, dec_y, quality, keyframe;
694 int x, y, i, mb_width, mb_height, blk_size, btype;
697 if (buf_size < HEADER_SIZE) {
698 av_log(avctx, AV_LOG_ERROR,
699 "Frame should have at least %d bytes, got %d instead\n",
700 HEADER_SIZE, buf_size);
701 return AVERROR_INVALIDDATA;
704 bytestream2_init(&gb, buf, buf_size);
705 keyframe = bytestream2_get_be32(&gb);
706 if (keyframe & ~0x301) {
707 av_log(avctx, AV_LOG_ERROR, "Invalid frame type %X\n", keyframe);
708 return AVERROR_INVALIDDATA;
710 keyframe = !(keyframe & 1);
711 bytestream2_skip(&gb, 6);
712 dec_x = bytestream2_get_be16(&gb);
713 dec_y = bytestream2_get_be16(&gb);
714 dec_width = bytestream2_get_be16(&gb);
715 dec_height = bytestream2_get_be16(&gb);
717 if (dec_x + dec_width > avctx->width ||
718 dec_y + dec_height > avctx->height ||
719 (dec_width | dec_height) & 0xF) {
720 av_log(avctx, AV_LOG_ERROR, "Invalid frame dimensions %dx%d +%d,%d\n",
721 dec_width, dec_height, dec_x, dec_y);
722 return AVERROR_INVALIDDATA;
724 bytestream2_skip(&gb, 4);
725 quality = bytestream2_get_byte(&gb);
726 if (quality < 1 || quality > 100) {
727 av_log(avctx, AV_LOG_ERROR, "Invalid quality setting %d\n", quality);
728 return AVERROR_INVALIDDATA;
730 bytestream2_skip(&gb, 4);
732 if (keyframe && !bytestream2_get_bytes_left(&gb)) {
733 av_log(avctx, AV_LOG_ERROR, "Keyframe without data found\n");
734 return AVERROR_INVALIDDATA;
736 if (!keyframe && c->got_error)
740 if ((ret = ff_reget_buffer(avctx, c->pic, 0)) < 0)
742 c->pic->key_frame = keyframe;
743 c->pic->pict_type = keyframe ? AV_PICTURE_TYPE_I : AV_PICTURE_TYPE_P;
744 if (!bytestream2_get_bytes_left(&gb)) {
745 if ((ret = av_frame_ref(data, c->pic)) < 0)
752 reset_coders(c, quality);
754 rac_init(acoder, buf + HEADER_SIZE, buf_size - HEADER_SIZE);
756 mb_width = dec_width >> 4;
757 mb_height = dec_height >> 4;
758 dst[0] = c->pic->data[0] + dec_x + dec_y * c->pic->linesize[0];
759 dst[1] = c->pic->data[1] + dec_x / 2 + (dec_y / 2) * c->pic->linesize[1];
760 dst[2] = c->pic->data[2] + dec_x / 2 + (dec_y / 2) * c->pic->linesize[2];
761 for (y = 0; y < mb_height; y++) {
762 for (x = 0; x < mb_width; x++) {
763 for (i = 0; i < 3; i++) {
766 btype = decode_block_type(acoder, c->btype + i);
769 decode_fill_block(acoder, c->fill_coder + i,
770 dst[i] + x * blk_size,
771 c->pic->linesize[i], blk_size);
774 decode_image_block(acoder, c->image_coder + i,
775 dst[i] + x * blk_size,
776 c->pic->linesize[i], blk_size);
779 decode_dct_block(acoder, c->dct_coder + i,
780 dst[i] + x * blk_size,
781 c->pic->linesize[i], blk_size,
785 decode_haar_block(acoder, c->haar_coder + i,
786 dst[i] + x * blk_size,
787 c->pic->linesize[i], blk_size,
791 if (c->got_error || acoder->got_error) {
792 av_log(avctx, AV_LOG_ERROR, "Error decoding block %d,%d\n",
795 return AVERROR_INVALIDDATA;
799 dst[0] += c->pic->linesize[0] * 16;
800 dst[1] += c->pic->linesize[1] * 8;
801 dst[2] += c->pic->linesize[2] * 8;
804 if ((ret = av_frame_ref(data, c->pic)) < 0)
812 static av_cold int mss3_decode_end(AVCodecContext *avctx)
814 MSS3Context * const c = avctx->priv_data;
817 av_frame_free(&c->pic);
818 for (i = 0; i < 3; i++)
819 av_freep(&c->dct_coder[i].prev_dc);
824 static av_cold int mss3_decode_init(AVCodecContext *avctx)
826 MSS3Context * const c = avctx->priv_data;
831 if ((avctx->width & 0xF) || (avctx->height & 0xF)) {
832 av_log(avctx, AV_LOG_ERROR,
833 "Image dimensions should be a multiple of 16.\n");
834 return AVERROR_INVALIDDATA;
838 for (i = 0; i < 3; i++) {
839 int b_width = avctx->width >> (2 + !!i);
840 int b_height = avctx->height >> (2 + !!i);
841 c->dct_coder[i].prev_dc_stride = b_width;
842 c->dct_coder[i].prev_dc_height = b_height;
843 c->dct_coder[i].prev_dc = av_malloc(sizeof(*c->dct_coder[i].prev_dc) *
845 if (!c->dct_coder[i].prev_dc) {
846 av_log(avctx, AV_LOG_ERROR, "Cannot allocate buffer\n");
847 av_frame_free(&c->pic);
849 av_freep(&c->dct_coder[i].prev_dc);
852 return AVERROR(ENOMEM);
856 c->pic = av_frame_alloc();
858 mss3_decode_end(avctx);
859 return AVERROR(ENOMEM);
862 avctx->pix_fmt = AV_PIX_FMT_YUV420P;
869 AVCodec ff_msa1_decoder = {
871 .long_name = NULL_IF_CONFIG_SMALL("MS ATC Screen"),
872 .type = AVMEDIA_TYPE_VIDEO,
873 .id = AV_CODEC_ID_MSA1,
874 .priv_data_size = sizeof(MSS3Context),
875 .init = mss3_decode_init,
876 .close = mss3_decode_end,
877 .decode = mss3_decode_frame,
878 .capabilities = AV_CODEC_CAP_DR1,