git.sesse.net Git - ffmpeg/blob - libavcodec/flacenc.c

   1 /*
   2  * FLAC audio encoder
   3  * Copyright (c) 2006  Justin Ruggles <justin.ruggles@gmail.com>
   4  *
   5  * This file is part of FFmpeg.
   6  *
   7  * FFmpeg is free software; you can redistribute it and/or
   8  * modify it under the terms of the GNU Lesser General Public
   9  * License as published by the Free Software Foundation; either
  10  * version 2.1 of the License, or (at your option) any later version.
  11  *
  12  * FFmpeg is distributed in the hope that it will be useful,
  13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  15  * Lesser General Public License for more details.
  16  *
  17  * You should have received a copy of the GNU Lesser General Public
  18  * License along with FFmpeg; if not, write to the Free Software
  19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20  */
  21
  22 #include "libavutil/avassert.h"
  23 #include "libavutil/crc.h"
  24 #include "libavutil/intmath.h"
  25 #include "libavutil/md5.h"
  26 #include "libavutil/opt.h"
  27 #include "avcodec.h"
  28 #include "bswapdsp.h"
  29 #include "put_bits.h"
  30 #include "golomb.h"
  31 #include "internal.h"
  32 #include "lpc.h"
  33 #include "flac.h"
  34 #include "flacdata.h"
  35 #include "flacdsp.h"
  36
  37 #define FLAC_SUBFRAME_CONSTANT  0   /* subframe type: every sample equals the first one */
  38 #define FLAC_SUBFRAME_VERBATIM  1   /* subframe type: samples are stored without prediction */
  39 #define FLAC_SUBFRAME_FIXED     8   /* subframe type: fixed predictor; OR-ed with the order to form type_code */
  40 #define FLAC_SUBFRAME_LPC      32   /* subframe type: LPC predictor; OR-ed with (order - 1) to form type_code */
  41
  42 #define MAX_FIXED_ORDER     4   /* highest order tried for the fixed predictor */
  43 #define MAX_PARTITION_ORDER 8   /* upper bound asserted for Rice partition orders */
  44 #define MAX_PARTITIONS     (1 << MAX_PARTITION_ORDER)   /* capacity of the per-partition parameter and sum arrays */
  45 #define MAX_LPC_PRECISION  15   /* NOTE(review): presumably the largest LPC coefficient precision in bits; not referenced in the visible part of the file */
  46 #define MAX_LPC_SHIFT      15   /* handed to ff_lpc_calc_coefs() when LPC coefficients are computed */
  47
  48 enum CodingMode {   /* Rice coding variant; the numeric value is also counted as the bit width of one stored Rice parameter */
  49     CODING_MODE_RICE  = 4,   /* selected by init_frame() when the subframe has at most 16 bits per sample */
  50     CODING_MODE_RICE2 = 5,   /* selected by init_frame() when the subframe has more than 16 bits per sample */
  51 };
  52
  53 typedef struct CompressionOptions {   /* encoder tuning parameters; several default from compression_level in flac_encode_init() */
  54     int compression_level;   /* 0..12; negative avctx value maps to 5; indexes the per-level default tables */
  55     int block_time_ms;   /* target block duration in milliseconds used by select_blocksize() */
  56     enum FFLPCType lpc_type;   /* predictor family: none, fixed, Levinson or Cholesky */
  57     int lpc_passes;   /* forwarded to ff_lpc_calc_coefs(); logged only for the Cholesky type */
  58     int lpc_coeff_precision;   /* bits counted per stored LPC coefficient */
  59     int min_prediction_order;   /* lowest prediction order tried */
  60     int max_prediction_order;   /* highest prediction order tried */
  61     int prediction_order_method;   /* one of ORDER_METHOD_*; a negative value selects the per-level default */
  62     int min_partition_order;   /* lower Rice partition order bound; negative selects the per-level default */
  63     int max_partition_order;   /* upper Rice partition order bound; negative selects the per-level default */
  64     int ch_mode;   /* NOTE(review): presumably the requested channel decorrelation mode; not used in the visible part of the file */
  65 } CompressionOptions;
  66
  67 typedef struct RiceContext {   /* Rice coding choice for one subframe's residual */
  68     enum CodingMode coding_mode;   /* also bounds the parameters: largest allowed value is (1 << coding_mode) - 2 */
  69     int porder;   /* partition order: the residual is split into 1 << porder partitions */
  70     int params[MAX_PARTITIONS];   /* Rice parameter of each partition; only the first 1 << porder entries are meaningful */
  71 } RiceContext;
  72
  73 typedef struct FlacSubframe {   /* per-channel encoding state for the current frame */
  74     int type;   /* one of FLAC_SUBFRAME_* */
  75     int type_code;   /* type combined with the prediction order (order for FIXED, order - 1 for LPC) */
  76     int obits;   /* bits per sample of this subframe; initialised from avctx->bits_per_raw_sample */
  77     int wasted;   /* added to the subframe bit count when non-zero; reset to 0 by init_frame() */
  78     int order;   /* prediction order that was selected */
  79     int32_t coefs[MAX_LPC_ORDER];   /* LPC coefficients of the selected order */
  80     int shift;   /* shift value belonging to the selected LPC coefficients */
  81     RiceContext rc;   /* Rice parameters chosen for the residual */
  82     int32_t samples[FLAC_MAX_BLOCKSIZE];   /* de-interleaved input samples of this channel */
  83     int32_t residual[FLAC_MAX_BLOCKSIZE+11];   /* prediction residual; NOTE(review): the 11 extra entries look like slack for predictors that write past blocksize - confirm */
  84 } FlacSubframe;
  85
  86 typedef struct FlacFrame {   /* state of the frame currently being encoded */
  87     FlacSubframe subframes[FLAC_MAX_CHANNELS];   /* one subframe per channel */
  88     int blocksize;   /* number of samples per channel in this frame */
  89     int bs_code[2];   /* [0]: blocksize table index, or 6/7 for an explicit size; [1]: blocksize - 1 when explicit, else 0 */
  90     uint8_t crc8;   /* NOTE(review): presumably the frame header CRC-8; not used in the visible part of the file */
  91     int ch_mode;   /* NOTE(review): presumably the channel mode chosen for this frame; not used in the visible part of the file */
  92     int verbatim_only;   /* when non-zero, non-constant subframes are stored verbatim */
  93 } FlacFrame;
  94
  95 typedef struct FlacEncodeContext {   /* private encoder context (avctx->priv_data) */
  96     AVClass *class;   /* NOTE(review): presumably required first member for AVOption handling - confirm */
  97     PutBitContext pb;   /* NOTE(review): presumably the frame bit writer; not used in the visible part of the file */
  98     int channels;   /* channel count, validated against FLAC_MAX_CHANNELS at init */
  99     int samplerate;   /* sample rate in Hz */
 100     int sr_code[2];   /* [0]: sample-rate code (table index 4..11, or 12/13/14 for an explicit rate); [1]: explicit value or 0 */
 101     int bps_code;   /* 4 for 16-bit input, 6 for 24-bit input */
 102     int max_blocksize;   /* avctx->frame_size; written as both blocksize fields of STREAMINFO */
 103     int min_framesize;   /* starts out equal to max_framesize at init */
 104     int max_framesize;   /* result of ff_flac_get_max_frame_size() for the configured stream */
 105     int max_encoded_framesize;   /* NOTE(review): presumably the largest frame actually produced; not used in the visible part of the file */
 106     uint32_t frame_count;   /* reset to 0 at init */
 107     uint64_t sample_count;   /* lower 36 bits are written to STREAMINFO */
 108     uint8_t md5sum[16];   /* copied into STREAMINFO at byte offset 18 */
 109     FlacFrame frame;   /* frame being encoded */
 110     CompressionOptions options;   /* effective compression settings */
 111     AVCodecContext *avctx;   /* back pointer to the owning codec context */
 112     LPCContext lpc_ctx;   /* set up by ff_lpc_init() and used by ff_lpc_calc_coefs() */
 113     struct AVMD5 *md5ctx;   /* allocated with av_md5_alloc() at init */
 114     uint8_t *md5_buffer;   /* NOTE(review): presumably scratch space for MD5 input; not used in the visible part of the file */
 115     unsigned int md5_buffer_size;   /* NOTE(review): presumably the allocated size of md5_buffer - confirm */
 116     BswapDSPContext bdsp;   /* initialised by ff_bswapdsp_init() */
 117     FLACDSPContext flac_dsp;   /* initialised by ff_flacdsp_init(); provides lpc_encode() */
 118
 119     int flushed;   /* NOTE(review): not used in the visible part of the file */
 120     int64_t next_pts;   /* NOTE(review): not used in the visible part of the file */
 121 } FlacEncodeContext;
 122
 123
 124 /**
 125  * Write streaminfo metadata block to byte array.
 126  */
 127 static void write_streaminfo(FlacEncodeContext *s, uint8_t *header)
 128 {
 129     PutBitContext pb;
 130
 131     memset(header, 0, FLAC_STREAMINFO_SIZE);
 132     init_put_bits(&pb, header, FLAC_STREAMINFO_SIZE);
 133
 134     /* streaminfo metadata block */
 135     put_bits(&pb, 16, s->max_blocksize);
 136     put_bits(&pb, 16, s->max_blocksize);
 137     put_bits(&pb, 24, s->min_framesize);
 138     put_bits(&pb, 24, s->max_framesize);
 139     put_bits(&pb, 20, s->samplerate);
 140     put_bits(&pb, 3, s->channels-1);
 141     put_bits(&pb,  5, s->avctx->bits_per_raw_sample - 1);
 142     /* write 36-bit sample count in 2 put_bits() calls */
 143     put_bits(&pb, 24, (s->sample_count & 0xFFFFFF000LL) >> 12);
 144     put_bits(&pb, 12,  s->sample_count & 0x000000FFFLL);
 145     flush_put_bits(&pb);
 146     memcpy(&header[18], s->md5sum, 16);
 147 }
 148
 149
 150 /**
 151  * Set blocksize based on samplerate.
 152  * Choose the closest predefined blocksize >= BLOCK_TIME_MS milliseconds.
 153  */
 154 static int select_blocksize(int samplerate, int block_time_ms)
 155 {
 156     int i;
 157     int target;
 158     int blocksize;
 159
 160     av_assert0(samplerate > 0);
 161     blocksize = ff_flac_blocksize_table[1];
 162     target    = (samplerate * block_time_ms) / 1000;
 163     for (i = 0; i < 16; i++) {
 164         if (target >= ff_flac_blocksize_table[i] &&
 165             ff_flac_blocksize_table[i] > blocksize) {
 166             blocksize = ff_flac_blocksize_table[i];
 167         }
 168     }
 169     return blocksize;
 170 }
 171
 172
 173 static av_cold void dprint_compression_options(FlacEncodeContext *s)
 174 {
 175     AVCodecContext     *avctx = s->avctx;
 176     CompressionOptions *opt   = &s->options;
 177
 178     av_log(avctx, AV_LOG_DEBUG, " compression: %d\n", opt->compression_level);
 179
 180     switch (opt->lpc_type) {
 181     case FF_LPC_TYPE_NONE:
 182         av_log(avctx, AV_LOG_DEBUG, " lpc type: None\n");
 183         break;
 184     case FF_LPC_TYPE_FIXED:
 185         av_log(avctx, AV_LOG_DEBUG, " lpc type: Fixed pre-defined coefficients\n");
 186         break;
 187     case FF_LPC_TYPE_LEVINSON:
 188         av_log(avctx, AV_LOG_DEBUG, " lpc type: Levinson-Durbin recursion with Welch window\n");
 189         break;
 190     case FF_LPC_TYPE_CHOLESKY:
 191         av_log(avctx, AV_LOG_DEBUG, " lpc type: Cholesky factorization, %d pass%s\n",
 192                opt->lpc_passes, opt->lpc_passes == 1 ? "" : "es");
 193         break;
 194     }
 195
 196     av_log(avctx, AV_LOG_DEBUG, " prediction order: %d, %d\n",
 197            opt->min_prediction_order, opt->max_prediction_order);
 198
 199     switch (opt->prediction_order_method) {
 200     case ORDER_METHOD_EST:
 201         av_log(avctx, AV_LOG_DEBUG, " order method: %s\n", "estimate");
 202         break;
 203     case ORDER_METHOD_2LEVEL:
 204         av_log(avctx, AV_LOG_DEBUG, " order method: %s\n", "2-level");
 205         break;
 206     case ORDER_METHOD_4LEVEL:
 207         av_log(avctx, AV_LOG_DEBUG, " order method: %s\n", "4-level");
 208         break;
 209     case ORDER_METHOD_8LEVEL:
 210         av_log(avctx, AV_LOG_DEBUG, " order method: %s\n", "8-level");
 211         break;
 212     case ORDER_METHOD_SEARCH:
 213         av_log(avctx, AV_LOG_DEBUG, " order method: %s\n", "full search");
 214         break;
 215     case ORDER_METHOD_LOG:
 216         av_log(avctx, AV_LOG_DEBUG, " order method: %s\n", "log search");
 217         break;
 218     }
 219
 220
 221     av_log(avctx, AV_LOG_DEBUG, " partition order: %d, %d\n",
 222            opt->min_partition_order, opt->max_partition_order);
 223
 224     av_log(avctx, AV_LOG_DEBUG, " block size: %d\n", avctx->frame_size);
 225
 226     av_log(avctx, AV_LOG_DEBUG, " lpc precision: %d\n",
 227            opt->lpc_coeff_precision);
 228 }
 229
 230
 231 static av_cold int flac_encode_init(AVCodecContext *avctx)
 232 {
 233     int freq = avctx->sample_rate;
 234     int channels = avctx->channels;
 235     FlacEncodeContext *s = avctx->priv_data;
 236     int i, level, ret;
 237     uint8_t *streaminfo;
 238
 239     s->avctx = avctx;
 240
 241     switch (avctx->sample_fmt) {
 242     case AV_SAMPLE_FMT_S16:
 243         avctx->bits_per_raw_sample = 16;
 244         s->bps_code                = 4;
 245         break;
 246     case AV_SAMPLE_FMT_S32:
 247         if (avctx->bits_per_raw_sample != 24)
 248             av_log(avctx, AV_LOG_WARNING, "encoding as 24 bits-per-sample\n");
 249         avctx->bits_per_raw_sample = 24;
 250         s->bps_code                = 6;
 251         break;
 252     }
 253
 254     if (channels < 1 || channels > FLAC_MAX_CHANNELS) {
 255         av_log(avctx, AV_LOG_ERROR, "%d channels not supported (max %d)\n",
 256                channels, FLAC_MAX_CHANNELS);
 257         return AVERROR(EINVAL);
 258     }
 259     s->channels = channels;
 260
 261     /* find samplerate in table */
 262     if (freq < 1)
 263         return -1;
 264     for (i = 4; i < 12; i++) {
 265         if (freq == ff_flac_sample_rate_table[i]) {
 266             s->samplerate = ff_flac_sample_rate_table[i];
 267             s->sr_code[0] = i;
 268             s->sr_code[1] = 0;
 269             break;
 270         }
 271     }
 272     /* if not in table, samplerate is non-standard */
 273     if (i == 12) {
 274         if (freq % 1000 == 0 && freq < 255000) {
 275             s->sr_code[0] = 12;
 276             s->sr_code[1] = freq / 1000;
 277         } else if (freq % 10 == 0 && freq < 655350) {
 278             s->sr_code[0] = 14;
 279             s->sr_code[1] = freq / 10;
 280         } else if (freq < 65535) {
 281             s->sr_code[0] = 13;
 282             s->sr_code[1] = freq;
 283         } else {
 284             av_log(avctx, AV_LOG_ERROR, "%d Hz not supported\n", freq);
 285             return AVERROR(EINVAL);
 286         }
 287         s->samplerate = freq;
 288     }
 289
 290     /* set compression option defaults based on avctx->compression_level */
 291     if (avctx->compression_level < 0)
 292         s->options.compression_level = 5;
 293     else
 294         s->options.compression_level = avctx->compression_level;
 295
 296     level = s->options.compression_level;
 297     if (level > 12) {
 298         av_log(avctx, AV_LOG_ERROR, "invalid compression level: %d\n",
 299                s->options.compression_level);
 300         return AVERROR(EINVAL);
 301     }
 302
 303     s->options.block_time_ms = ((int[]){ 27, 27, 27,105,105,105,105,105,105,105,105,105,105})[level];
 304
 305     if (s->options.lpc_type == FF_LPC_TYPE_DEFAULT)
 306         s->options.lpc_type  = ((int[]){ FF_LPC_TYPE_FIXED,    FF_LPC_TYPE_FIXED,    FF_LPC_TYPE_FIXED,
 307                                          FF_LPC_TYPE_LEVINSON, FF_LPC_TYPE_LEVINSON, FF_LPC_TYPE_LEVINSON,
 308                                          FF_LPC_TYPE_LEVINSON, FF_LPC_TYPE_LEVINSON, FF_LPC_TYPE_LEVINSON,
 309                                          FF_LPC_TYPE_LEVINSON, FF_LPC_TYPE_LEVINSON, FF_LPC_TYPE_LEVINSON,
 310                                          FF_LPC_TYPE_LEVINSON})[level];
 311
 312     s->options.min_prediction_order = ((int[]){  2,  0,  0,  1,  1,  1,  1,  1,  1,  1,  1,  1,  1})[level];
 313     s->options.max_prediction_order = ((int[]){  3,  4,  4,  6,  8,  8,  8,  8, 12, 12, 12, 32, 32})[level];
 314
 315     if (s->options.prediction_order_method < 0)
 316         s->options.prediction_order_method = ((int[]){ ORDER_METHOD_EST,    ORDER_METHOD_EST,    ORDER_METHOD_EST,
 317                                                        ORDER_METHOD_EST,    ORDER_METHOD_EST,    ORDER_METHOD_EST,
 318                                                        ORDER_METHOD_4LEVEL, ORDER_METHOD_LOG,    ORDER_METHOD_4LEVEL,
 319                                                        ORDER_METHOD_LOG,    ORDER_METHOD_SEARCH, ORDER_METHOD_LOG,
 320                                                        ORDER_METHOD_SEARCH})[level];
 321
 322     if (s->options.min_partition_order > s->options.max_partition_order) {
 323         av_log(avctx, AV_LOG_ERROR, "invalid partition orders: min=%d max=%d\n",
 324                s->options.min_partition_order, s->options.max_partition_order);
 325         return AVERROR(EINVAL);
 326     }
 327     if (s->options.min_partition_order < 0)
 328         s->options.min_partition_order = ((int[]){  2,  2,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0})[level];
 329     if (s->options.max_partition_order < 0)
 330         s->options.max_partition_order = ((int[]){  2,  2,  3,  3,  3,  8,  8,  8,  8,  8,  8,  8,  8})[level];
 331
 332     if (s->options.lpc_type == FF_LPC_TYPE_NONE) {
 333         s->options.min_prediction_order = 0;
 334     } else if (avctx->min_prediction_order >= 0) {
 335         if (s->options.lpc_type == FF_LPC_TYPE_FIXED) {
 336             if (avctx->min_prediction_order > MAX_FIXED_ORDER) {
 337                 av_log(avctx, AV_LOG_ERROR, "invalid min prediction order: %d\n",
 338                        avctx->min_prediction_order);
 339                 return AVERROR(EINVAL);
 340             }
 341         } else if (avctx->min_prediction_order < MIN_LPC_ORDER ||
 342                    avctx->min_prediction_order > MAX_LPC_ORDER) {
 343             av_log(avctx, AV_LOG_ERROR, "invalid min prediction order: %d\n",
 344                    avctx->min_prediction_order);
 345             return AVERROR(EINVAL);
 346         }
 347         s->options.min_prediction_order = avctx->min_prediction_order;
 348     }
 349     if (s->options.lpc_type == FF_LPC_TYPE_NONE) {
 350         s->options.max_prediction_order = 0;
 351     } else if (avctx->max_prediction_order >= 0) {
 352         if (s->options.lpc_type == FF_LPC_TYPE_FIXED) {
 353             if (avctx->max_prediction_order > MAX_FIXED_ORDER) {
 354                 av_log(avctx, AV_LOG_ERROR, "invalid max prediction order: %d\n",
 355                        avctx->max_prediction_order);
 356                 return AVERROR(EINVAL);
 357             }
 358         } else if (avctx->max_prediction_order < MIN_LPC_ORDER ||
 359                    avctx->max_prediction_order > MAX_LPC_ORDER) {
 360             av_log(avctx, AV_LOG_ERROR, "invalid max prediction order: %d\n",
 361                    avctx->max_prediction_order);
 362             return AVERROR(EINVAL);
 363         }
 364         s->options.max_prediction_order = avctx->max_prediction_order;
 365     }
 366     if (s->options.max_prediction_order < s->options.min_prediction_order) {
 367         av_log(avctx, AV_LOG_ERROR, "invalid prediction orders: min=%d max=%d\n",
 368                s->options.min_prediction_order, s->options.max_prediction_order);
 369         return AVERROR(EINVAL);
 370     }
 371
 372     if (avctx->frame_size > 0) {
 373         if (avctx->frame_size < FLAC_MIN_BLOCKSIZE ||
 374                 avctx->frame_size > FLAC_MAX_BLOCKSIZE) {
 375             av_log(avctx, AV_LOG_ERROR, "invalid block size: %d\n",
 376                    avctx->frame_size);
 377             return AVERROR(EINVAL);
 378         }
 379     } else {
 380         s->avctx->frame_size = select_blocksize(s->samplerate, s->options.block_time_ms);
 381     }
 382     s->max_blocksize = s->avctx->frame_size;
 383
 384     /* set maximum encoded frame size in verbatim mode */
 385     s->max_framesize = ff_flac_get_max_frame_size(s->avctx->frame_size,
 386                                                   s->channels,
 387                                                   s->avctx->bits_per_raw_sample);
 388
 389     /* initialize MD5 context */
 390     s->md5ctx = av_md5_alloc();
 391     if (!s->md5ctx)
 392         return AVERROR(ENOMEM);
 393     av_md5_init(s->md5ctx);
 394
 395     streaminfo = av_malloc(FLAC_STREAMINFO_SIZE);
 396     if (!streaminfo)
 397         return AVERROR(ENOMEM);
 398     write_streaminfo(s, streaminfo);
 399     avctx->extradata = streaminfo;
 400     avctx->extradata_size = FLAC_STREAMINFO_SIZE;
 401
 402     s->frame_count   = 0;
 403     s->min_framesize = s->max_framesize;
 404
 405     if (channels == 3 &&
 406             avctx->channel_layout != (AV_CH_LAYOUT_STEREO|AV_CH_FRONT_CENTER) ||
 407         channels == 4 &&
 408             avctx->channel_layout != AV_CH_LAYOUT_2_2 &&
 409             avctx->channel_layout != AV_CH_LAYOUT_QUAD ||
 410         channels == 5 &&
 411             avctx->channel_layout != AV_CH_LAYOUT_5POINT0 &&
 412             avctx->channel_layout != AV_CH_LAYOUT_5POINT0_BACK ||
 413         channels == 6 &&
 414             avctx->channel_layout != AV_CH_LAYOUT_5POINT1 &&
 415             avctx->channel_layout != AV_CH_LAYOUT_5POINT1_BACK) {
 416         if (avctx->channel_layout) {
 417             av_log(avctx, AV_LOG_ERROR, "Channel layout not supported by Flac, "
 418                                              "output stream will have incorrect "
 419                                              "channel layout.\n");
 420         } else {
 421             av_log(avctx, AV_LOG_WARNING, "No channel layout specified. The encoder "
 422                                                "will use Flac channel layout for "
 423                                                "%d channels.\n", channels);
 424         }
 425     }
 426
 427     ret = ff_lpc_init(&s->lpc_ctx, avctx->frame_size,
 428                       s->options.max_prediction_order, FF_LPC_TYPE_LEVINSON);
 429
 430     ff_bswapdsp_init(&s->bdsp);
 431     ff_flacdsp_init(&s->flac_dsp, avctx->sample_fmt, channels,
 432                     avctx->bits_per_raw_sample);
 433
 434     dprint_compression_options(s);
 435
 436     return ret;
 437 }
 438
 439
 440 static void init_frame(FlacEncodeContext *s, int nb_samples)
 441 {
 442     int i, ch;
 443     FlacFrame *frame;
 444
 445     frame = &s->frame;
 446
 447     for (i = 0; i < 16; i++) {
 448         if (nb_samples == ff_flac_blocksize_table[i]) {
 449             frame->blocksize  = ff_flac_blocksize_table[i];
 450             frame->bs_code[0] = i;
 451             frame->bs_code[1] = 0;
 452             break;
 453         }
 454     }
 455     if (i == 16) {
 456         frame->blocksize = nb_samples;
 457         if (frame->blocksize <= 256) {
 458             frame->bs_code[0] = 6;
 459             frame->bs_code[1] = frame->blocksize-1;
 460         } else {
 461             frame->bs_code[0] = 7;
 462             frame->bs_code[1] = frame->blocksize-1;
 463         }
 464     }
 465
 466     for (ch = 0; ch < s->channels; ch++) {
 467         FlacSubframe *sub = &frame->subframes[ch];
 468
 469         sub->wasted = 0;
 470         sub->obits  = s->avctx->bits_per_raw_sample;
 471
 472         if (sub->obits > 16)
 473             sub->rc.coding_mode = CODING_MODE_RICE2;
 474         else
 475             sub->rc.coding_mode = CODING_MODE_RICE;
 476     }
 477
 478     frame->verbatim_only = 0;
 479 }
 480
 481
 482 /**
 483  * Copy channel-interleaved input samples into separate subframes.
 484  */
 485 static void copy_samples(FlacEncodeContext *s, const void *samples)
 486 {
 487     int i, j, ch;
 488     FlacFrame *frame;
 489     int shift = av_get_bytes_per_sample(s->avctx->sample_fmt) * 8 -
 490                 s->avctx->bits_per_raw_sample;
 491
 492 #define COPY_SAMPLES(bits) do {                                     \
 493     const int ## bits ## _t *samples0 = samples;                    \
 494     frame = &s->frame;                                              \
 495     for (i = 0, j = 0; i < frame->blocksize; i++)                   \
 496         for (ch = 0; ch < s->channels; ch++, j++)                   \
 497             frame->subframes[ch].samples[i] = samples0[j] >> shift; \
 498 } while (0)
 499
 500     if (s->avctx->sample_fmt == AV_SAMPLE_FMT_S16)
 501         COPY_SAMPLES(16);
 502     else
 503         COPY_SAMPLES(32);
 504 }
 505
 506
 507 static uint64_t rice_count_exact(int32_t *res, int n, int k)
 508 {
 509     int i;
 510     uint64_t count = 0;
 511
 512     for (i = 0; i < n; i++) {
 513         int32_t v = -2 * res[i] - 1;
 514         v ^= v >> 31;
 515         count += (v >> k) + 1 + k;
 516     }
 517     return count;
 518 }
 519
 520
 521 static uint64_t subframe_count_exact(FlacEncodeContext *s, FlacSubframe *sub,
 522                                      int pred_order)
 523 {
 524     int p, porder, psize;
 525     int i, part_end;
 526     uint64_t count = 0;
 527
 528     /* subframe header */
 529     count += 8;
 530
 531     if (sub->wasted)
 532         count += sub->wasted;
 533
 534     /* subframe */
 535     if (sub->type == FLAC_SUBFRAME_CONSTANT) {
 536         count += sub->obits;
 537     } else if (sub->type == FLAC_SUBFRAME_VERBATIM) {
 538         count += s->frame.blocksize * sub->obits;
 539     } else {
 540         /* warm-up samples */
 541         count += pred_order * sub->obits;
 542
 543         /* LPC coefficients */
 544         if (sub->type == FLAC_SUBFRAME_LPC)
 545             count += 4 + 5 + pred_order * s->options.lpc_coeff_precision;
 546
 547         /* rice-encoded block */
 548         count += 2;
 549
 550         /* partition order */
 551         porder = sub->rc.porder;
 552         psize  = s->frame.blocksize >> porder;
 553         count += 4;
 554
 555         /* residual */
 556         i        = pred_order;
 557         part_end = psize;
 558         for (p = 0; p < 1 << porder; p++) {
 559             int k = sub->rc.params[p];
 560             count += sub->rc.coding_mode;
 561             count += rice_count_exact(&sub->residual[i], part_end - i, k);
 562             i = part_end;
 563             part_end = FFMIN(s->frame.blocksize, part_end + psize);
 564         }
 565     }
 566
 567     return count;
 568 }
 569
 570
 571 #define rice_encode_count(sum, n, k) (((n)*((k)+1))+((sum-(n>>1))>>(k)))
 572
 573 /**
 574  * Solve for d/dk(rice_encode_count) = n-((sum-(n>>1))>>(k+1)) = 0.
 575  */
 576 static int find_optimal_param(uint64_t sum, int n, int max_param)
 577 {
 578     int k;
 579     uint64_t sum2;
 580
 581     if (sum <= n >> 1)
 582         return 0;
 583     sum2 = sum - (n >> 1);
 584     k    = av_log2(av_clipl_int32(sum2 / n));
 585     return FFMIN(k, max_param);
 586 }
 587
 588
 589 static uint64_t calc_optimal_rice_params(RiceContext *rc, int porder,
 590                                          uint64_t *sums, int n, int pred_order)
 591 {
 592     int i;
 593     int k, cnt, part, max_param;
 594     uint64_t all_bits;
 595
 596     max_param = (1 << rc->coding_mode) - 2;
 597
 598     part     = (1 << porder);
 599     all_bits = 4 * part;
 600
 601     cnt = (n >> porder) - pred_order;
 602     for (i = 0; i < part; i++) {
 603         k = find_optimal_param(sums[i], cnt, max_param);
 604         rc->params[i] = k;
 605         all_bits += rice_encode_count(sums[i], cnt, k);
 606         cnt = n >> porder;
 607     }
 608
 609     rc->porder = porder;
 610
 611     return all_bits;
 612 }
 613
 614
 615 static void calc_sum_top(int pmax, uint32_t *data, int n, int pred_order,
 616                          uint64_t sums[MAX_PARTITIONS])
 617 {
 618     int i;
 619     int parts;
 620     uint32_t *res, *res_end;
 621
 622     /* sums for highest level */
 623     parts   = (1 << pmax);
 624     res     = &data[pred_order];
 625     res_end = &data[n >> pmax];
 626     for (i = 0; i < parts; i++) {
 627         uint64_t sum = 0;
 628         while (res < res_end)
 629             sum += *(res++);
 630         sums[i] = sum;
 631         res_end += n >> pmax;
 632     }
 633 }
 634
 635 static void calc_sum_next(int level, uint64_t sums[MAX_PARTITIONS])
 636 {
 637     int i;
 638     int parts = (1 << level);
 639     for (i = 0; i < parts; i++)
 640         sums[i] = sums[2*i] + sums[2*i+1];
 641 }
 642
 643 static uint64_t calc_rice_params(RiceContext *rc, int pmin, int pmax,
 644                                  int32_t *data, int n, int pred_order)
 645 {
 646     int i;
 647     uint64_t bits[MAX_PARTITION_ORDER+1];
 648     int opt_porder;
 649     RiceContext tmp_rc;
 650     uint32_t *udata;
 651     uint64_t sums[MAX_PARTITIONS];
 652
 653     av_assert1(pmin >= 0 && pmin <= MAX_PARTITION_ORDER);
 654     av_assert1(pmax >= 0 && pmax <= MAX_PARTITION_ORDER);
 655     av_assert1(pmin <= pmax);
 656
 657     tmp_rc.coding_mode = rc->coding_mode;
 658
 659     udata = av_malloc_array(n,  sizeof(uint32_t));
 660     for (i = 0; i < n; i++)
 661         udata[i] = (2*data[i]) ^ (data[i]>>31);
 662
 663     calc_sum_top(pmax, udata, n, pred_order, sums);
 664
 665     opt_porder = pmin;
 666     bits[pmin] = UINT32_MAX;
 667     for (i = pmax; ; ) {
 668         bits[i] = calc_optimal_rice_params(&tmp_rc, i, sums, n, pred_order);
 669         if (bits[i] < bits[opt_porder]) {
 670             opt_porder = i;
 671             *rc = tmp_rc;
 672         }
 673         if (i == pmin)
 674             break;
 675         calc_sum_next(--i, sums);
 676     }
 677
 678     av_freep(&udata);
 679     return bits[opt_porder];
 680 }
 681
 682
 683 static int get_max_p_order(int max_porder, int n, int order)
 684 {
 685     int porder = FFMIN(max_porder, av_log2(n^(n-1)));
 686     if (order > 0)
 687         porder = FFMIN(porder, av_log2(n/order));
 688     return porder;
 689 }
 690
 691
 692 static uint64_t find_subframe_rice_params(FlacEncodeContext *s,
 693                                           FlacSubframe *sub, int pred_order)
 694 {
 695     int pmin = get_max_p_order(s->options.min_partition_order,
 696                                s->frame.blocksize, pred_order);
 697     int pmax = get_max_p_order(s->options.max_partition_order,
 698                                s->frame.blocksize, pred_order);
 699
 700     uint64_t bits = 8 + pred_order * sub->obits + 2 + sub->rc.coding_mode;
 701     if (sub->type == FLAC_SUBFRAME_LPC)
 702         bits += 4 + 5 + pred_order * s->options.lpc_coeff_precision;
 703     bits += calc_rice_params(&sub->rc, pmin, pmax, sub->residual,
 704                              s->frame.blocksize, pred_order);
 705     return bits;
 706 }
 707
 708
 709 static void encode_residual_fixed(int32_t *res, const int32_t *smp, int n,
 710                                   int order)
 711 {
 712     int i;
 713
 714     for (i = 0; i < order; i++)
 715         res[i] = smp[i];
 716
 717     if (order == 0) {
 718         for (i = order; i < n; i++)
 719             res[i] = smp[i];
 720     } else if (order == 1) {
 721         for (i = order; i < n; i++)
 722             res[i] = smp[i] - smp[i-1];
 723     } else if (order == 2) {
 724         int a = smp[order-1] - smp[order-2];
 725         for (i = order; i < n; i += 2) {
 726             int b    = smp[i  ] - smp[i-1];
 727             res[i]   = b - a;
 728             a        = smp[i+1] - smp[i  ];
 729             res[i+1] = a - b;
 730         }
 731     } else if (order == 3) {
 732         int a = smp[order-1] -   smp[order-2];
 733         int c = smp[order-1] - 2*smp[order-2] + smp[order-3];
 734         for (i = order; i < n; i += 2) {
 735             int b    = smp[i  ] - smp[i-1];
 736             int d    = b - a;
 737             res[i]   = d - c;
 738             a        = smp[i+1] - smp[i  ];
 739             c        = a - b;
 740             res[i+1] = c - d;
 741         }
 742     } else {
 743         int a = smp[order-1] -   smp[order-2];
 744         int c = smp[order-1] - 2*smp[order-2] +   smp[order-3];
 745         int e = smp[order-1] - 3*smp[order-2] + 3*smp[order-3] - smp[order-4];
 746         for (i = order; i < n; i += 2) {
 747             int b    = smp[i  ] - smp[i-1];
 748             int d    = b - a;
 749             int f    = d - c;
 750             res[i  ] = f - e;
 751             a        = smp[i+1] - smp[i  ];
 752             c        = a - b;
 753             e        = c - d;
 754             res[i+1] = e - f;
 755         }
 756     }
 757 }
 758
 759
 760 static int encode_residual_ch(FlacEncodeContext *s, int ch)
 761 {
         /*
          * Choose the subframe type and prediction order for channel ch of
          * the current frame, leave the matching residual and Rice
          * parameters in the subframe, and return the subframe size in bits
          * as computed by subframe_count_exact().
          *
          * Candidates are considered in this sequence: CONSTANT, VERBATIM,
          * FIXED prediction, and finally LPC with one of several order
          * search strategies.
          */
 762     int i, n;
 763     int min_order, max_order, opt_order, omethod;
 764     FlacFrame *frame;
 765     FlacSubframe *sub;
 766     int32_t coefs[MAX_LPC_ORDER][MAX_LPC_ORDER]; /* coefs[k] holds the coefficients for order k + 1 */
 767     int shift[MAX_LPC_ORDER]; /* shift[k] belongs to coefs[k] */
 768     int32_t *res, *smp;
 769
 770     frame = &s->frame;
 771     sub   = &frame->subframes[ch];
 772     res   = sub->residual;
 773     smp   = sub->samples;
 774     n     = frame->blocksize;
 775
 776     /* CONSTANT */
 777     for (i = 1; i < n; i++) /* stop at the first sample that differs from smp[0] */
 778         if(smp[i] != smp[0])
 779             break;
 780     if (i == n) { /* no differing sample was found */
 781         sub->type = sub->type_code = FLAC_SUBFRAME_CONSTANT;
 782         res[0] = smp[0];
 783         return subframe_count_exact(s, sub, 0);
 784     }
 785
 786     /* VERBATIM */
 787     if (frame->verbatim_only || n < 5) { /* forced by the frame, or fewer than 5 samples */
 788         sub->type = sub->type_code = FLAC_SUBFRAME_VERBATIM;
 789         memcpy(res, smp, n * sizeof(int32_t));
 790         return subframe_count_exact(s, sub, 0);
 791     }
 792
 793     min_order  = s->options.min_prediction_order;
 794     max_order  = s->options.max_prediction_order;
 795     omethod    = s->options.prediction_order_method;
 796
 797     /* FIXED */
 798     sub->type = FLAC_SUBFRAME_FIXED;
 799     if (s->options.lpc_type == FF_LPC_TYPE_NONE  ||
 800         s->options.lpc_type == FF_LPC_TYPE_FIXED || n <= max_order) { /* also taken when the block is not longer than the maximum order */
 801         uint64_t bits[MAX_FIXED_ORDER+1]; /* estimated size per fixed order */
 802         if (max_order > MAX_FIXED_ORDER)
 803             max_order = MAX_FIXED_ORDER;
 804         opt_order = 0;
 805         bits[0]   = UINT32_MAX; /* initial value to beat; replaced by a real estimate if order 0 is tried */
 806         for (i = min_order; i <= max_order; i++) {
 807             encode_residual_fixed(res, smp, n, i);
 808             bits[i] = find_subframe_rice_params(s, sub, i);
 809             if (bits[i] < bits[opt_order])
 810                 opt_order = i;
 811         }
 812         sub->order     = opt_order;
 813         sub->type_code = sub->type | sub->order;
 814         if (sub->order != max_order) { /* res and sub->rc still describe max_order, the last order tried */
 815             encode_residual_fixed(res, smp, n, sub->order);
 816             find_subframe_rice_params(s, sub, sub->order);
 817         }
 818         return subframe_count_exact(s, sub, sub->order);
 819     }
 820
 821     /* LPC */
 822     sub->type = FLAC_SUBFRAME_LPC;
 823     opt_order = ff_lpc_calc_coefs(&s->lpc_ctx, smp, n, min_order, max_order, /* return value is used as the order unless one of the searches below replaces it */
 824                                   s->options.lpc_coeff_precision, coefs, shift, s->options.lpc_type,
 825                                   s->options.lpc_passes, omethod,
 826                                   MAX_LPC_SHIFT, 0);
 827
 828     if (omethod == ORDER_METHOD_2LEVEL ||
 829         omethod == ORDER_METHOD_4LEVEL ||
 830         omethod == ORDER_METHOD_8LEVEL) {
 831         int levels = 1 << omethod; /* number of orders to sample between min_order and max_order */
 832         uint64_t bits[1 << ORDER_METHOD_8LEVEL];
 833         int order       = -1;
 834         int opt_index   = levels-1;
 835         opt_order       = max_order-1; /* zero-based order index from here until the increment below */
 836         bits[opt_index] = UINT32_MAX;
 837         for (i = levels-1; i >= 0; i--) {
 838             int last_order = order;
 839             order = min_order + (((max_order-min_order+1) * (i+1)) / levels)-1;
 840             order = av_clip(order, min_order - 1, max_order - 1);
 841             if (order == last_order) /* same order as the previous level: already evaluated */
 842                 continue;
 843             s->flac_dsp.lpc_encode(res, smp, n, order+1, coefs[order],
 844                                    shift[order]);
 845             bits[i] = find_subframe_rice_params(s, sub, order+1);
 846             if (bits[i] < bits[opt_index]) {
 847                 opt_index = i;
 848                 opt_order = order;
 849             }
 850         }
 851         opt_order++; /* back to a one-based order */
 852     } else if (omethod == ORDER_METHOD_SEARCH) {
 853         // brute-force optimal order search
 854         uint64_t bits[MAX_LPC_ORDER]; /* indexed by order - 1 */
 855         opt_order = 0;
 856         bits[0]   = UINT32_MAX;
 857         for (i = min_order-1; i < max_order; i++) {
 858             s->flac_dsp.lpc_encode(res, smp, n, i+1, coefs[i], shift[i]);
 859             bits[i] = find_subframe_rice_params(s, sub, i+1);
 860             if (bits[i] < bits[opt_order])
 861                 opt_order = i;
 862         }
 863         opt_order++; /* back to a one-based order */
 864     } else if (omethod == ORDER_METHOD_LOG) {
 865         uint64_t bits[MAX_LPC_ORDER]; /* indexed by order - 1 */
 866         int step;
 867
 868         opt_order = min_order - 1 + (max_order-min_order)/3; /* starting point one third into the range */
 869         memset(bits, -1, sizeof(bits)); /* all-ones marks an order as not evaluated yet */
 870
 871         for (step = 16; step; step >>= 1) { /* probe both neighbours of the best order at halving distances */
 872             int last = opt_order;
 873             for (i = last-step; i <= last+step; i += step) {
 874                 if (i < min_order-1 || i >= max_order || bits[i] < UINT32_MAX) /* skip orders out of range or already evaluated */
 875                     continue;
 876                 s->flac_dsp.lpc_encode(res, smp, n, i+1, coefs[i], shift[i]);
 877                 bits[i] = find_subframe_rice_params(s, sub, i+1);
 878                 if (bits[i] < bits[opt_order])
 879                     opt_order = i;
 880             }
 881         }
 882         opt_order++; /* back to a one-based order */
 883     }
 884
 885     sub->order     = opt_order;
 886     sub->type_code = sub->type | (sub->order-1);
 887     sub->shift     = shift[sub->order-1];
 888     for (i = 0; i < sub->order; i++)
 889         sub->coefs[i] = coefs[sub->order-1][i];
 890
 891     s->flac_dsp.lpc_encode(res, smp, n, sub->order, sub->coefs, sub->shift); /* recompute the residual for the selected order */
 892
 893     find_subframe_rice_params(s, sub, sub->order); /* leaves the Rice parameters for that residual in sub->rc */
 894
 895     return subframe_count_exact(s, sub, sub->order);
 896 }
 897
 898
 899 static int count_frame_header(FlacEncodeContext *s)
 900 {
 901     uint8_t av_unused tmp;
 902     int count;
 903
 904     /*
 905     <14> Sync code
 906     <1>  Reserved
 907     <1>  Blocking strategy
 908     <4>  Block size in inter-channel samples
 909     <4>  Sample rate
 910     <4>  Channel assignment
 911     <3>  Sample size in bits
 912     <1>  Reserved
 913     */
 914     count = 32;
 915
 916     /* coded frame number */
 917     PUT_UTF8(s->frame_count, tmp, count += 8;)
 918
 919     /* explicit block size */
 920     if (s->frame.bs_code[0] == 6)
 921         count += 8;
 922     else if (s->frame.bs_code[0] == 7)
 923         count += 16;
 924
 925     /* explicit sample rate */
 926     count += ((s->sr_code[0] == 12) + (s->sr_code[0] > 12)) * 8;
 927
 928     /* frame header CRC-8 */
 929     count += 8;
 930
 931     return count;
 932 }
 933
 934
 935 static int encode_frame(FlacEncodeContext *s)
 936 {
 937     int ch;
 938     uint64_t count;
 939
 940     count = count_frame_header(s);
 941
 942     for (ch = 0; ch < s->channels; ch++)
 943         count += encode_residual_ch(s, ch);
 944
 945     count += (8 - (count & 7)) & 7; // byte alignment
 946     count += 16;                    // CRC-16
 947
 948     count >>= 3;
 949     if (count > INT_MAX)
 950         return AVERROR_BUG;
 951     return count;
 952 }
 953
 954
 955 static void remove_wasted_bits(FlacEncodeContext *s)
 956 {
 957     int ch, i;
 958
 959     for (ch = 0; ch < s->channels; ch++) {
 960         FlacSubframe *sub = &s->frame.subframes[ch];
 961         int32_t v         = 0;
 962
 963         for (i = 0; i < s->frame.blocksize; i++) {
 964             v |= sub->samples[i];
 965             if (v & 1)
 966                 break;
 967         }
 968
 969         if (v && !(v & 1)) {
 970             v = av_ctz(v);
 971
 972             for (i = 0; i < s->frame.blocksize; i++)
 973                 sub->samples[i] >>= v;
 974
 975             sub->wasted = v;
 976             sub->obits -= v;
 977
 978             /* for 24-bit, check if removing wasted bits makes the range better
 979                suited for using RICE instead of RICE2 for entropy coding */
 980             if (sub->obits <= 17)
 981                 sub->rc.coding_mode = CODING_MODE_RICE;
 982         }
 983     }
 984 }
 985
 986
 /**
  * Pick a stereo coding mode from an estimate of the coded size.
  *
  * A 2nd-order fixed-predictor residual is computed for the left, right,
  * mid and side signals; the summed magnitudes are converted to estimated
  * Rice bit counts and combined per candidate mode.
  *
  * @param left_ch        left channel samples
  * @param right_ch       right channel samples
  * @param n              number of samples per channel
  * @param max_rice_param upper bound passed to find_optimal_param()
  * @return index (0..3) of the candidate with the lowest score; on ties the
  *         lowest index wins. The caller stores it as the frame's ch_mode,
  *         so the order presumably matches FLAC_CHMODE_* (TODO confirm).
  */
static int estimate_stereo_mode(int32_t *left_ch, int32_t *right_ch, int n,
                                int max_rice_param)
{
    /* cost[0] = left, cost[1] = right, cost[2] = mid, cost[3] = side */
    uint64_t cost[4] = { 0, 0, 0, 0 };
    uint64_t score[4];
    int i, best_mode;

    /* calculate sum of 2nd order residual for each channel */
    for (i = 2; i < n; i++) {
        int32_t l = left_ch[i]  - 2*left_ch[i-1]  + left_ch[i-2];
        int32_t r = right_ch[i] - 2*right_ch[i-1] + right_ch[i-2];

        cost[0] += FFABS(l);
        cost[1] += FFABS(r);
        cost[2] += FFABS((l + r) >> 1);
        cost[3] += FFABS(l - r);
    }

    /* turn each magnitude sum into an estimated bit count */
    for (i = 0; i < 4; i++) {
        uint64_t doubled = 2 * cost[i];
        int k            = find_optimal_param(doubled, n, max_rice_param);

        cost[i] = rice_encode_count(doubled, n, k);
    }

    /* each candidate mode codes two of the four signals */
    score[0] = cost[0] + cost[1]; /* left  + right */
    score[1] = cost[0] + cost[3]; /* left  + side  */
    score[2] = cost[1] + cost[3]; /* right + side  */
    score[3] = cost[2] + cost[3]; /* mid   + side  */

    /* return mode with lowest score */
    best_mode = 0;
    for (i = 1; i < 4; i++) {
        if (score[i] < score[best_mode])
            best_mode = i;
    }

    return best_mode;
}
1026
1027
1028 /**
1029  * Perform stereo channel decorrelation.
1030  */
1031 static void channel_decorrelation(FlacEncodeContext *s)
1032 {
1033     FlacFrame *frame;
1034     int32_t *left, *right;
1035     int i, n;
1036
1037     frame = &s->frame;
1038     n     = frame->blocksize;
1039     left  = frame->subframes[0].samples;
1040     right = frame->subframes[1].samples;
1041
1042     if (s->channels != 2) {
1043         frame->ch_mode = FLAC_CHMODE_INDEPENDENT;
1044         return;
1045     }
1046
1047     if (s->options.ch_mode < 0) {
1048         int max_rice_param = (1 << frame->subframes[0].rc.coding_mode) - 2;
1049         frame->ch_mode = estimate_stereo_mode(left, right, n, max_rice_param);
1050     } else
1051         frame->ch_mode = s->options.ch_mode;
1052
1053     /* perform decorrelation and adjust bits-per-sample */
1054     if (frame->ch_mode == FLAC_CHMODE_INDEPENDENT)
1055         return;
1056     if (frame->ch_mode == FLAC_CHMODE_MID_SIDE) {
1057         int32_t tmp;
1058         for (i = 0; i < n; i++) {
1059             tmp      = left[i];
1060             left[i]  = (tmp + right[i]) >> 1;
1061             right[i] =  tmp - right[i];
1062         }
1063         frame->subframes[1].obits++;
1064     } else if (frame->ch_mode == FLAC_CHMODE_LEFT_SIDE) {
1065         for (i = 0; i < n; i++)
1066             right[i] = left[i] - right[i];
1067         frame->subframes[1].obits++;
1068     } else {
1069         for (i = 0; i < n; i++)
1070             left[i] -= right[i];
1071         frame->subframes[0].obits++;
1072     }
1073 }
1074
1075
1076 static void write_utf8(PutBitContext *pb, uint32_t val)
1077 {
1078     uint8_t tmp;
1079     PUT_UTF8(val, tmp, put_bits(pb, 8, tmp);)
1080 }
1081
1082
1083 static void write_frame_header(FlacEncodeContext *s)
1084 {
1085     FlacFrame *frame;
1086     int crc;
1087
1088     frame = &s->frame;
1089
1090     put_bits(&s->pb, 16, 0xFFF8);
1091     put_bits(&s->pb, 4, frame->bs_code[0]);
1092     put_bits(&s->pb, 4, s->sr_code[0]);
1093
1094     if (frame->ch_mode == FLAC_CHMODE_INDEPENDENT)
1095         put_bits(&s->pb, 4, s->channels-1);
1096     else
1097         put_bits(&s->pb, 4, frame->ch_mode + FLAC_MAX_CHANNELS - 1);
1098
1099     put_bits(&s->pb, 3, s->bps_code);
1100     put_bits(&s->pb, 1, 0);
1101     write_utf8(&s->pb, s->frame_count);
1102
1103     if (frame->bs_code[0] == 6)
1104         put_bits(&s->pb, 8, frame->bs_code[1]);
1105     else if (frame->bs_code[0] == 7)
1106         put_bits(&s->pb, 16, frame->bs_code[1]);
1107
1108     if (s->sr_code[0] == 12)
1109         put_bits(&s->pb, 8, s->sr_code[1]);
1110     else if (s->sr_code[0] > 12)
1111         put_bits(&s->pb, 16, s->sr_code[1]);
1112
1113     flush_put_bits(&s->pb);
1114     crc = av_crc(av_crc_get_table(AV_CRC_8_ATM), 0, s->pb.buf,
1115                  put_bits_count(&s->pb) >> 3);
1116     put_bits(&s->pb, 8, crc);
1117 }
1118
1119
1120 static void write_subframes(FlacEncodeContext *s)
1121 {
1122     int ch;
1123
1124     for (ch = 0; ch < s->channels; ch++) {
1125         FlacSubframe *sub = &s->frame.subframes[ch];
1126         int i, p, porder, psize;
1127         int32_t *part_end;
1128         int32_t *res       =  sub->residual;
1129         int32_t *frame_end = &sub->residual[s->frame.blocksize];
1130
1131         /* subframe header */
1132         put_bits(&s->pb, 1, 0);
1133         put_bits(&s->pb, 6, sub->type_code);
1134         put_bits(&s->pb, 1, !!sub->wasted);
1135         if (sub->wasted)
1136             put_bits(&s->pb, sub->wasted, 1);
1137
1138         /* subframe */
1139         if (sub->type == FLAC_SUBFRAME_CONSTANT) {
1140             put_sbits(&s->pb, sub->obits, res[0]);
1141         } else if (sub->type == FLAC_SUBFRAME_VERBATIM) {
1142             while (res < frame_end)
1143                 put_sbits(&s->pb, sub->obits, *res++);
1144         } else {
1145             /* warm-up samples */
1146             for (i = 0; i < sub->order; i++)
1147                 put_sbits(&s->pb, sub->obits, *res++);
1148
1149             /* LPC coefficients */
1150             if (sub->type == FLAC_SUBFRAME_LPC) {
1151                 int cbits = s->options.lpc_coeff_precision;
1152                 put_bits( &s->pb, 4, cbits-1);
1153                 put_sbits(&s->pb, 5, sub->shift);
1154                 for (i = 0; i < sub->order; i++)
1155                     put_sbits(&s->pb, cbits, sub->coefs[i]);
1156             }
1157
1158             /* rice-encoded block */
1159             put_bits(&s->pb, 2, sub->rc.coding_mode - 4);
1160
1161             /* partition order */
1162             porder  = sub->rc.porder;
1163             psize   = s->frame.blocksize >> porder;
1164             put_bits(&s->pb, 4, porder);
1165
1166             /* residual */
1167             part_end  = &sub->residual[psize];
1168             for (p = 0; p < 1 << porder; p++) {
1169                 int k = sub->rc.params[p];
1170                 put_bits(&s->pb, sub->rc.coding_mode, k);
1171                 while (res < part_end)
1172                     set_sr_golomb_flac(&s->pb, *res++, k, INT32_MAX, 0);
1173                 part_end = FFMIN(frame_end, part_end + psize);
1174             }
1175         }
1176     }
1177 }
1178
1179
1180 static void write_frame_footer(FlacEncodeContext *s)
1181 {
1182     int crc;
1183     flush_put_bits(&s->pb);
1184     crc = av_bswap16(av_crc(av_crc_get_table(AV_CRC_16_ANSI), 0, s->pb.buf,
1185                             put_bits_count(&s->pb)>>3));
1186     put_bits(&s->pb, 16, crc);
1187     flush_put_bits(&s->pb);
1188 }
1189
1190
1191 static int write_frame(FlacEncodeContext *s, AVPacket *avpkt)
1192 {
1193     init_put_bits(&s->pb, avpkt->data, avpkt->size);
1194     write_frame_header(s);
1195     write_subframes(s);
1196     write_frame_footer(s);
1197     return put_bits_count(&s->pb) >> 3;
1198 }
1199
1200
1201 static int update_md5_sum(FlacEncodeContext *s, const void *samples)
1202 {
1203     const uint8_t *buf;
1204     int buf_size = s->frame.blocksize * s->channels *
1205                    ((s->avctx->bits_per_raw_sample + 7) / 8);
1206
1207     if (s->avctx->bits_per_raw_sample > 16 || HAVE_BIGENDIAN) {
1208         av_fast_malloc(&s->md5_buffer, &s->md5_buffer_size, buf_size);
1209         if (!s->md5_buffer)
1210             return AVERROR(ENOMEM);
1211     }
1212
1213     if (s->avctx->bits_per_raw_sample <= 16) {
1214         buf = (const uint8_t *)samples;
1215 #if HAVE_BIGENDIAN
1216         s->bdsp.bswap16_buf((uint16_t *) s->md5_buffer,
1217                             (const uint16_t *) samples, buf_size / 2);
1218         buf = s->md5_buffer;
1219 #endif
1220     } else {
1221         int i;
1222         const int32_t *samples0 = samples;
1223         uint8_t *tmp            = s->md5_buffer;
1224
1225         for (i = 0; i < s->frame.blocksize * s->channels; i++) {
1226             int32_t v = samples0[i] >> 8;
1227             *tmp++    = (v      ) & 0xFF;
1228             *tmp++    = (v >>  8) & 0xFF;
1229             *tmp++    = (v >> 16) & 0xFF;
1230         }
1231         buf = s->md5_buffer;
1232     }
1233     av_md5_update(s->md5ctx, buf, buf_size);
1234
1235     return 0;
1236 }
1237
1238
1239 static int flac_encode_frame(AVCodecContext *avctx, AVPacket *avpkt,
1240                              const AVFrame *frame, int *got_packet_ptr)
1241 {
1242     FlacEncodeContext *s;
1243     int frame_bytes, out_bytes, ret;
1244
1245     s = avctx->priv_data;
1246
1247     /* when the last block is reached, update the header in extradata */
1248     if (!frame) {
1249         s->max_framesize = s->max_encoded_framesize;
1250         av_md5_final(s->md5ctx, s->md5sum);
1251         write_streaminfo(s, avctx->extradata);
1252
1253         if (avctx->side_data_only_packets && !s->flushed) {
1254             uint8_t *side_data = av_packet_new_side_data(avpkt, AV_PKT_DATA_NEW_EXTRADATA,
1255                                                          avctx->extradata_size);
1256             if (!side_data)
1257                 return AVERROR(ENOMEM);
1258             memcpy(side_data, avctx->extradata, avctx->extradata_size);
1259
1260             avpkt->pts = s->next_pts;
1261
1262             *got_packet_ptr = 1;
1263             s->flushed = 1;
1264         }
1265
1266         return 0;
1267     }
1268
1269     /* change max_framesize for small final frame */
1270     if (frame->nb_samples < s->frame.blocksize) {
1271         s->max_framesize = ff_flac_get_max_frame_size(frame->nb_samples,
1272                                                       s->channels,
1273                                                       avctx->bits_per_raw_sample);
1274     }
1275
1276     init_frame(s, frame->nb_samples);
1277
1278     copy_samples(s, frame->data[0]);
1279
1280     channel_decorrelation(s);
1281
1282     remove_wasted_bits(s);
1283
1284     frame_bytes = encode_frame(s);
1285
1286     /* Fall back on verbatim mode if the compressed frame is larger than it
1287        would be if encoded uncompressed. */
1288     if (frame_bytes < 0 || frame_bytes > s->max_framesize) {
1289         s->frame.verbatim_only = 1;
1290         frame_bytes = encode_frame(s);
1291         if (frame_bytes < 0) {
1292             av_log(avctx, AV_LOG_ERROR, "Bad frame count\n");
1293             return frame_bytes;
1294         }
1295     }
1296
1297     if ((ret = ff_alloc_packet2(avctx, avpkt, frame_bytes)) < 0)
1298         return ret;
1299
1300     out_bytes = write_frame(s, avpkt);
1301
1302     s->frame_count++;
1303     s->sample_count += frame->nb_samples;
1304     if ((ret = update_md5_sum(s, frame->data[0])) < 0) {
1305         av_log(avctx, AV_LOG_ERROR, "Error updating MD5 checksum\n");
1306         return ret;
1307     }
1308     if (out_bytes > s->max_encoded_framesize)
1309         s->max_encoded_framesize = out_bytes;
1310     if (out_bytes < s->min_framesize)
1311         s->min_framesize = out_bytes;
1312
1313     avpkt->pts      = frame->pts;
1314     avpkt->duration = ff_samples_to_time_base(avctx, frame->nb_samples);
1315     avpkt->size     = out_bytes;
1316
1317     s->next_pts = avpkt->pts + avpkt->duration;
1318
1319     *got_packet_ptr = 1;
1320     return 0;
1321 }
1322
1323
1324 static av_cold int flac_encode_close(AVCodecContext *avctx)
1325 {
1326     if (avctx->priv_data) {
1327         FlacEncodeContext *s = avctx->priv_data;
1328         av_freep(&s->md5ctx);
1329         av_freep(&s->md5_buffer);
1330         ff_lpc_end(&s->lpc_ctx);
1331     }
1332     av_freep(&avctx->extradata);
1333     avctx->extradata_size = 0;
1334     return 0;
1335 }
1336
1337 #define FLAGS AV_OPT_FLAG_ENCODING_PARAM | AV_OPT_FLAG_AUDIO_PARAM
1338 static const AVOption options[] = {
1339 { "lpc_coeff_precision", "LPC coefficient precision", offsetof(FlacEncodeContext, options.lpc_coeff_precision), AV_OPT_TYPE_INT, {.i64 = 15 }, 0, MAX_LPC_PRECISION, FLAGS },
1340 { "lpc_type", "LPC algorithm", offsetof(FlacEncodeContext, options.lpc_type), AV_OPT_TYPE_INT, {.i64 = FF_LPC_TYPE_DEFAULT }, FF_LPC_TYPE_DEFAULT, FF_LPC_TYPE_NB-1, FLAGS, "lpc_type" },
1341 { "none",     NULL, 0, AV_OPT_TYPE_CONST, {.i64 = FF_LPC_TYPE_NONE },     INT_MIN, INT_MAX, FLAGS, "lpc_type" },
1342 { "fixed",    NULL, 0, AV_OPT_TYPE_CONST, {.i64 = FF_LPC_TYPE_FIXED },    INT_MIN, INT_MAX, FLAGS, "lpc_type" },
1343 { "levinson", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = FF_LPC_TYPE_LEVINSON }, INT_MIN, INT_MAX, FLAGS, "lpc_type" },
1344 { "cholesky", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = FF_LPC_TYPE_CHOLESKY }, INT_MIN, INT_MAX, FLAGS, "lpc_type" },
1345 { "lpc_passes", "Number of passes to use for Cholesky factorization during LPC analysis", offsetof(FlacEncodeContext, options.lpc_passes),  AV_OPT_TYPE_INT, {.i64 = 2 }, 1, INT_MAX, FLAGS },
1346 { "min_partition_order",  NULL, offsetof(FlacEncodeContext, options.min_partition_order),  AV_OPT_TYPE_INT, {.i64 = -1 },      -1, MAX_PARTITION_ORDER, FLAGS },
1347 { "max_partition_order",  NULL, offsetof(FlacEncodeContext, options.max_partition_order),  AV_OPT_TYPE_INT, {.i64 = -1 },      -1, MAX_PARTITION_ORDER, FLAGS },
1348 { "prediction_order_method", "Search method for selecting prediction order", offsetof(FlacEncodeContext, options.prediction_order_method), AV_OPT_TYPE_INT, {.i64 = -1 }, -1, ORDER_METHOD_LOG, FLAGS, "predm" },
1349 { "estimation", NULL, 0, AV_OPT_TYPE_CONST, {.i64 = ORDER_METHOD_EST },    INT_MIN, INT_MAX, FLAGS, "predm" },
1350 { "2level",     NULL, 0, AV_OPT_TYPE_CONST, {.i64 = ORDER_METHOD_2LEVEL }, INT_MIN, INT_MAX, FLAGS, "predm" },
1351 { "4level",     NULL, 0, AV_OPT_TYPE_CONST, {.i64 = ORDER_METHOD_4LEVEL }, INT_MIN, INT_MAX, FLAGS, "predm" },
1352 { "8level",     NULL, 0, AV_OPT_TYPE_CONST, {.i64 = ORDER_METHOD_8LEVEL }, INT_MIN, INT_MAX, FLAGS, "predm" },
1353 { "search",     NULL, 0, AV_OPT_TYPE_CONST, {.i64 = ORDER_METHOD_SEARCH }, INT_MIN, INT_MAX, FLAGS, "predm" },
1354 { "log",        NULL, 0, AV_OPT_TYPE_CONST, {.i64 = ORDER_METHOD_LOG },    INT_MIN, INT_MAX, FLAGS, "predm" },
1355 { "ch_mode", "Stereo decorrelation mode", offsetof(FlacEncodeContext, options.ch_mode), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, FLAC_CHMODE_MID_SIDE, FLAGS, "ch_mode" },
1356 { "auto",       NULL, 0, AV_OPT_TYPE_CONST, { .i64 = -1                      }, INT_MIN, INT_MAX, FLAGS, "ch_mode" },
1357 { "indep",      NULL, 0, AV_OPT_TYPE_CONST, { .i64 = FLAC_CHMODE_INDEPENDENT }, INT_MIN, INT_MAX, FLAGS, "ch_mode" },
1358 { "left_side",  NULL, 0, AV_OPT_TYPE_CONST, { .i64 = FLAC_CHMODE_LEFT_SIDE   }, INT_MIN, INT_MAX, FLAGS, "ch_mode" },
1359 { "right_side", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = FLAC_CHMODE_RIGHT_SIDE  }, INT_MIN, INT_MAX, FLAGS, "ch_mode" },
1360 { "mid_side",   NULL, 0, AV_OPT_TYPE_CONST, { .i64 = FLAC_CHMODE_MID_SIDE    }, INT_MIN, INT_MAX, FLAGS, "ch_mode" },
1361 { NULL },
1362 };
1363
1364 static const AVClass flac_encoder_class = {
1365     "FLAC encoder",
1366     av_default_item_name,
1367     options,
1368     LIBAVUTIL_VERSION_INT,
1369 };
1370
1371 AVCodec ff_flac_encoder = {
1372     .name           = "flac",
1373     .long_name      = NULL_IF_CONFIG_SMALL("FLAC (Free Lossless Audio Codec)"),
1374     .type           = AVMEDIA_TYPE_AUDIO,
1375     .id             = AV_CODEC_ID_FLAC,
1376     .priv_data_size = sizeof(FlacEncodeContext),
1377     .init           = flac_encode_init,
1378     .encode2        = flac_encode_frame,
1379     .close          = flac_encode_close,
1380     .capabilities   = CODEC_CAP_SMALL_LAST_FRAME | CODEC_CAP_DELAY | CODEC_CAP_LOSSLESS,
1381     .sample_fmts    = (const enum AVSampleFormat[]){ AV_SAMPLE_FMT_S16,
1382                                                      AV_SAMPLE_FMT_S32,
1383                                                      AV_SAMPLE_FMT_NONE },
1384     .priv_class     = &flac_encoder_class,
1385 };