git.sesse.net Git - ffmpeg/blob - libavcodec/flacenc.c

   1 /**
   2  * FLAC audio encoder
   3  * Copyright (c) 2006  Justin Ruggles <justin.ruggles@gmail.com>
   4  *
   5  * This file is part of FFmpeg.
   6  *
   7  * FFmpeg is free software; you can redistribute it and/or
   8  * modify it under the terms of the GNU Lesser General Public
   9  * License as published by the Free Software Foundation; either
  10  * version 2.1 of the License, or (at your option) any later version.
  11  *
  12  * FFmpeg is distributed in the hope that it will be useful,
  13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  15  * Lesser General Public License for more details.
  16  *
  17  * You should have received a copy of the GNU Lesser General Public
  18  * License along with FFmpeg; if not, write to the Free Software
  19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20  */
  21
  22 #include "libavutil/crc.h"
  23 #include "libavutil/md5.h"
  24 #include "avcodec.h"
  25 #include "get_bits.h"
  26 #include "dsputil.h"
  27 #include "golomb.h"
  28 #include "lpc.h"
  29 #include "flac.h"
  30 #include "flacdata.h"
  31
  32 #define FLAC_SUBFRAME_CONSTANT  0
  33 #define FLAC_SUBFRAME_VERBATIM  1
  34 #define FLAC_SUBFRAME_FIXED     8
  35 #define FLAC_SUBFRAME_LPC      32
  36
  37 #define MAX_FIXED_ORDER     4
  38 #define MAX_PARTITION_ORDER 8
  39 #define MAX_PARTITIONS     (1 << MAX_PARTITION_ORDER)
  40 #define MAX_LPC_PRECISION  15
  41 #define MAX_LPC_SHIFT      15
  42 #define MAX_RICE_PARAM     14
  43
  44 typedef struct CompressionOptions {
  45     int compression_level;
  46     int block_time_ms;
  47     enum AVLPCType lpc_type;
  48     int lpc_passes;
  49     int lpc_coeff_precision;
  50     int min_prediction_order;
  51     int max_prediction_order;
  52     int prediction_order_method;
  53     int min_partition_order;
  54     int max_partition_order;
  55 } CompressionOptions;
  56
  57 typedef struct RiceContext {
  58     int porder;
  59     int params[MAX_PARTITIONS];
  60 } RiceContext;
  61
  62 typedef struct FlacSubframe {
  63     int type;
  64     int type_code;
  65     int obits;
  66     int order;
  67     int32_t coefs[MAX_LPC_ORDER];
  68     int shift;
  69     RiceContext rc;
  70     int32_t samples[FLAC_MAX_BLOCKSIZE];
  71     int32_t residual[FLAC_MAX_BLOCKSIZE+1];
  72 } FlacSubframe;
  73
  74 typedef struct FlacFrame {
  75     FlacSubframe subframes[FLAC_MAX_CHANNELS];
  76     int blocksize;
  77     int bs_code[2];
  78     uint8_t crc8;
  79     int ch_mode;
  80 } FlacFrame;
  81
  82 typedef struct FlacEncodeContext {
  83     PutBitContext pb;
  84     int channels;
  85     int samplerate;
  86     int sr_code[2];
  87     int max_blocksize;
  88     int min_framesize;
  89     int max_framesize;
  90     int max_encoded_framesize;
  91     uint32_t frame_count;
  92     uint64_t sample_count;
  93     uint8_t md5sum[16];
  94     FlacFrame frame;
  95     CompressionOptions options;
  96     AVCodecContext *avctx;
  97     DSPContext dsp;
  98     struct AVMD5 *md5ctx;
  99 } FlacEncodeContext;
 100
 101
 102 /**
 103  * Write streaminfo metadata block to byte array.
 104  */
 105 static void write_streaminfo(FlacEncodeContext *s, uint8_t *header)
 106 {
 107     PutBitContext pb;
 108
 109     memset(header, 0, FLAC_STREAMINFO_SIZE);
 110     init_put_bits(&pb, header, FLAC_STREAMINFO_SIZE);
 111
 112     /* streaminfo metadata block */
 113     put_bits(&pb, 16, s->max_blocksize);
 114     put_bits(&pb, 16, s->max_blocksize);
 115     put_bits(&pb, 24, s->min_framesize);
 116     put_bits(&pb, 24, s->max_framesize);
 117     put_bits(&pb, 20, s->samplerate);
 118     put_bits(&pb, 3, s->channels-1);
 119     put_bits(&pb, 5, 15);       /* bits per sample - 1 */
 120     /* write 36-bit sample count in 2 put_bits() calls */
 121     put_bits(&pb, 24, (s->sample_count & 0xFFFFFF000LL) >> 12);
 122     put_bits(&pb, 12,  s->sample_count & 0x000000FFFLL);
 123     flush_put_bits(&pb);
 124     memcpy(&header[18], s->md5sum, 16);
 125 }
 126
 127
 128 /**
 129  * Set blocksize based on samplerate.
 130  * Choose the closest predefined blocksize >= BLOCK_TIME_MS milliseconds.
 131  */
 132 static int select_blocksize(int samplerate, int block_time_ms)
 133 {
 134     int i;
 135     int target;
 136     int blocksize;
 137
 138     assert(samplerate > 0);
 139     blocksize = ff_flac_blocksize_table[1];
 140     target    = (samplerate * block_time_ms) / 1000;
 141     for (i = 0; i < 16; i++) {
 142         if (target >= ff_flac_blocksize_table[i] &&
 143             ff_flac_blocksize_table[i] > blocksize) {
 144             blocksize = ff_flac_blocksize_table[i];
 145         }
 146     }
 147     return blocksize;
 148 }
 149
 150
 151 static av_cold void dprint_compression_options(FlacEncodeContext *s)
 152 {
 153     AVCodecContext     *avctx = s->avctx;
 154     CompressionOptions *opt   = &s->options;
 155
 156     av_log(avctx, AV_LOG_DEBUG, " compression: %d\n", opt->compression_level);
 157
 158     switch (opt->lpc_type) {
 159     case AV_LPC_TYPE_NONE:
 160         av_log(avctx, AV_LOG_DEBUG, " lpc type: None\n");
 161         break;
 162     case AV_LPC_TYPE_FIXED:
 163         av_log(avctx, AV_LOG_DEBUG, " lpc type: Fixed pre-defined coefficients\n");
 164         break;
 165     case AV_LPC_TYPE_LEVINSON:
 166         av_log(avctx, AV_LOG_DEBUG, " lpc type: Levinson-Durbin recursion with Welch window\n");
 167         break;
 168     case AV_LPC_TYPE_CHOLESKY:
 169         av_log(avctx, AV_LOG_DEBUG, " lpc type: Cholesky factorization, %d pass%s\n",
 170                opt->lpc_passes, opt->lpc_passes == 1 ? "" : "es");
 171         break;
 172     }
 173
 174     av_log(avctx, AV_LOG_DEBUG, " prediction order: %d, %d\n",
 175            opt->min_prediction_order, opt->max_prediction_order);
 176
 177     switch (opt->prediction_order_method) {
 178     case ORDER_METHOD_EST:
 179         av_log(avctx, AV_LOG_DEBUG, " order method: %s\n", "estimate");
 180         break;
 181     case ORDER_METHOD_2LEVEL:
 182         av_log(avctx, AV_LOG_DEBUG, " order method: %s\n", "2-level");
 183         break;
 184     case ORDER_METHOD_4LEVEL:
 185         av_log(avctx, AV_LOG_DEBUG, " order method: %s\n", "4-level");
 186         break;
 187     case ORDER_METHOD_8LEVEL:
 188         av_log(avctx, AV_LOG_DEBUG, " order method: %s\n", "8-level");
 189         break;
 190     case ORDER_METHOD_SEARCH:
 191         av_log(avctx, AV_LOG_DEBUG, " order method: %s\n", "full search");
 192         break;
 193     case ORDER_METHOD_LOG:
 194         av_log(avctx, AV_LOG_DEBUG, " order method: %s\n", "log search");
 195         break;
 196     }
 197
 198
 199     av_log(avctx, AV_LOG_DEBUG, " partition order: %d, %d\n",
 200            opt->min_partition_order, opt->max_partition_order);
 201
 202     av_log(avctx, AV_LOG_DEBUG, " block size: %d\n", avctx->frame_size);
 203
 204     av_log(avctx, AV_LOG_DEBUG, " lpc precision: %d\n",
 205            opt->lpc_coeff_precision);
 206 }
 207
 208
 209 static av_cold int flac_encode_init(AVCodecContext *avctx)
 210 {
 211     int freq = avctx->sample_rate;
 212     int channels = avctx->channels;
 213     FlacEncodeContext *s = avctx->priv_data;
 214     int i, level;
 215     uint8_t *streaminfo;
 216
 217     s->avctx = avctx;
 218
 219     dsputil_init(&s->dsp, avctx);
 220
 221     if (avctx->sample_fmt != SAMPLE_FMT_S16)
 222         return -1;
 223
 224     if (channels < 1 || channels > FLAC_MAX_CHANNELS)
 225         return -1;
 226     s->channels = channels;
 227
 228     /* find samplerate in table */
 229     if (freq < 1)
 230         return -1;
 231     for (i = 4; i < 12; i++) {
 232         if (freq == ff_flac_sample_rate_table[i]) {
 233             s->samplerate = ff_flac_sample_rate_table[i];
 234             s->sr_code[0] = i;
 235             s->sr_code[1] = 0;
 236             break;
 237         }
 238     }
 239     /* if not in table, samplerate is non-standard */
 240     if (i == 12) {
 241         if (freq % 1000 == 0 && freq < 255000) {
 242             s->sr_code[0] = 12;
 243             s->sr_code[1] = freq / 1000;
 244         } else if (freq % 10 == 0 && freq < 655350) {
 245             s->sr_code[0] = 14;
 246             s->sr_code[1] = freq / 10;
 247         } else if (freq < 65535) {
 248             s->sr_code[0] = 13;
 249             s->sr_code[1] = freq;
 250         } else {
 251             return -1;
 252         }
 253         s->samplerate = freq;
 254     }
 255
 256     /* set compression option defaults based on avctx->compression_level */
 257     if (avctx->compression_level < 0)
 258         s->options.compression_level = 5;
 259     else
 260         s->options.compression_level = avctx->compression_level;
 261
 262     level = s->options.compression_level;
 263     if (level > 12) {
 264         av_log(avctx, AV_LOG_ERROR, "invalid compression level: %d\n",
 265                s->options.compression_level);
 266         return -1;
 267     }
 268
 269     s->options.block_time_ms = ((int[]){ 27, 27, 27,105,105,105,105,105,105,105,105,105,105})[level];
 270
 271     s->options.lpc_type      = ((int[]){ AV_LPC_TYPE_FIXED,    AV_LPC_TYPE_FIXED,    AV_LPC_TYPE_FIXED,
 272                                          AV_LPC_TYPE_LEVINSON, AV_LPC_TYPE_LEVINSON, AV_LPC_TYPE_LEVINSON,
 273                                          AV_LPC_TYPE_LEVINSON, AV_LPC_TYPE_LEVINSON, AV_LPC_TYPE_LEVINSON,
 274                                          AV_LPC_TYPE_LEVINSON, AV_LPC_TYPE_LEVINSON, AV_LPC_TYPE_LEVINSON,
 275                                          AV_LPC_TYPE_LEVINSON})[level];
 276
 277     s->options.min_prediction_order = ((int[]){  2,  0,  0,  1,  1,  1,  1,  1,  1,  1,  1,  1,  1})[level];
 278     s->options.max_prediction_order = ((int[]){  3,  4,  4,  6,  8,  8,  8,  8, 12, 12, 12, 32, 32})[level];
 279
 280     s->options.prediction_order_method = ((int[]){ ORDER_METHOD_EST,    ORDER_METHOD_EST,    ORDER_METHOD_EST,
 281                                                    ORDER_METHOD_EST,    ORDER_METHOD_EST,    ORDER_METHOD_EST,
 282                                                    ORDER_METHOD_4LEVEL, ORDER_METHOD_LOG,    ORDER_METHOD_4LEVEL,
 283                                                    ORDER_METHOD_LOG,    ORDER_METHOD_SEARCH, ORDER_METHOD_LOG,
 284                                                    ORDER_METHOD_SEARCH})[level];
 285
 286     s->options.min_partition_order = ((int[]){  2,  2,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0})[level];
 287     s->options.max_partition_order = ((int[]){  2,  2,  3,  3,  3,  8,  8,  8,  8,  8,  8,  8,  8})[level];
 288
 289     /* set compression option overrides from AVCodecContext */
 290 #if LIBAVCODEC_VERSION_MAJOR < 53
 291     /* for compatibility with deprecated AVCodecContext.use_lpc */
 292     if (avctx->use_lpc == 0) {
 293         s->options.lpc_type = AV_LPC_TYPE_FIXED;
 294     } else if (avctx->use_lpc == 1) {
 295         s->options.lpc_type = AV_LPC_TYPE_LEVINSON;
 296     } else if (avctx->use_lpc > 1) {
 297         s->options.lpc_type   = AV_LPC_TYPE_CHOLESKY;
 298         s->options.lpc_passes = avctx->use_lpc - 1;
 299     }
 300 #endif
 301     if (avctx->lpc_type > AV_LPC_TYPE_DEFAULT) {
 302         if (avctx->lpc_type > AV_LPC_TYPE_CHOLESKY) {
 303             av_log(avctx, AV_LOG_ERROR, "unknown lpc type: %d\n", avctx->lpc_type);
 304             return -1;
 305         }
 306         s->options.lpc_type = avctx->lpc_type;
 307         if (s->options.lpc_type == AV_LPC_TYPE_CHOLESKY) {
 308             if (avctx->lpc_passes < 0) {
 309                 // default number of passes for Cholesky
 310                 s->options.lpc_passes = 2;
 311             } else if (avctx->lpc_passes == 0) {
 312                 av_log(avctx, AV_LOG_ERROR, "invalid number of lpc passes: %d\n",
 313                        avctx->lpc_passes);
 314                 return -1;
 315             } else {
 316                 s->options.lpc_passes = avctx->lpc_passes;
 317             }
 318         }
 319     }
 320
 321     if (s->options.lpc_type == AV_LPC_TYPE_NONE) {
 322         s->options.min_prediction_order = 0;
 323     } else if (avctx->min_prediction_order >= 0) {
 324         if (s->options.lpc_type == AV_LPC_TYPE_FIXED) {
 325             if (avctx->min_prediction_order > MAX_FIXED_ORDER) {
 326                 av_log(avctx, AV_LOG_ERROR, "invalid min prediction order: %d\n",
 327                        avctx->min_prediction_order);
 328                 return -1;
 329             }
 330         } else if (avctx->min_prediction_order < MIN_LPC_ORDER ||
 331                    avctx->min_prediction_order > MAX_LPC_ORDER) {
 332             av_log(avctx, AV_LOG_ERROR, "invalid min prediction order: %d\n",
 333                    avctx->min_prediction_order);
 334             return -1;
 335         }
 336         s->options.min_prediction_order = avctx->min_prediction_order;
 337     }
 338     if (s->options.lpc_type == AV_LPC_TYPE_NONE) {
 339         s->options.max_prediction_order = 0;
 340     } else if (avctx->max_prediction_order >= 0) {
 341         if (s->options.lpc_type == AV_LPC_TYPE_FIXED) {
 342             if (avctx->max_prediction_order > MAX_FIXED_ORDER) {
 343                 av_log(avctx, AV_LOG_ERROR, "invalid max prediction order: %d\n",
 344                        avctx->max_prediction_order);
 345                 return -1;
 346             }
 347         } else if (avctx->max_prediction_order < MIN_LPC_ORDER ||
 348                    avctx->max_prediction_order > MAX_LPC_ORDER) {
 349             av_log(avctx, AV_LOG_ERROR, "invalid max prediction order: %d\n",
 350                    avctx->max_prediction_order);
 351             return -1;
 352         }
 353         s->options.max_prediction_order = avctx->max_prediction_order;
 354     }
 355     if (s->options.max_prediction_order < s->options.min_prediction_order) {
 356         av_log(avctx, AV_LOG_ERROR, "invalid prediction orders: min=%d max=%d\n",
 357                s->options.min_prediction_order, s->options.max_prediction_order);
 358         return -1;
 359     }
 360
 361     if (avctx->prediction_order_method >= 0) {
 362         if (avctx->prediction_order_method > ORDER_METHOD_LOG) {
 363             av_log(avctx, AV_LOG_ERROR, "invalid prediction order method: %d\n",
 364                    avctx->prediction_order_method);
 365             return -1;
 366         }
 367         s->options.prediction_order_method = avctx->prediction_order_method;
 368     }
 369
 370     if (avctx->min_partition_order >= 0) {
 371         if (avctx->min_partition_order > MAX_PARTITION_ORDER) {
 372             av_log(avctx, AV_LOG_ERROR, "invalid min partition order: %d\n",
 373                    avctx->min_partition_order);
 374             return -1;
 375         }
 376         s->options.min_partition_order = avctx->min_partition_order;
 377     }
 378     if (avctx->max_partition_order >= 0) {
 379         if (avctx->max_partition_order > MAX_PARTITION_ORDER) {
 380             av_log(avctx, AV_LOG_ERROR, "invalid max partition order: %d\n",
 381                    avctx->max_partition_order);
 382             return -1;
 383         }
 384         s->options.max_partition_order = avctx->max_partition_order;
 385     }
 386     if (s->options.max_partition_order < s->options.min_partition_order) {
 387         av_log(avctx, AV_LOG_ERROR, "invalid partition orders: min=%d max=%d\n",
 388                s->options.min_partition_order, s->options.max_partition_order);
 389         return -1;
 390     }
 391
 392     if (avctx->frame_size > 0) {
 393         if (avctx->frame_size < FLAC_MIN_BLOCKSIZE ||
 394                 avctx->frame_size > FLAC_MAX_BLOCKSIZE) {
 395             av_log(avctx, AV_LOG_ERROR, "invalid block size: %d\n",
 396                    avctx->frame_size);
 397             return -1;
 398         }
 399     } else {
 400         s->avctx->frame_size = select_blocksize(s->samplerate, s->options.block_time_ms);
 401     }
 402     s->max_blocksize = s->avctx->frame_size;
 403
 404     /* set LPC precision */
 405     if (avctx->lpc_coeff_precision > 0) {
 406         if (avctx->lpc_coeff_precision > MAX_LPC_PRECISION) {
 407             av_log(avctx, AV_LOG_ERROR, "invalid lpc coeff precision: %d\n",
 408                    avctx->lpc_coeff_precision);
 409             return -1;
 410         }
 411         s->options.lpc_coeff_precision = avctx->lpc_coeff_precision;
 412     } else {
 413         /* default LPC precision */
 414         s->options.lpc_coeff_precision = 15;
 415     }
 416
 417     /* set maximum encoded frame size in verbatim mode */
 418     s->max_framesize = ff_flac_get_max_frame_size(s->avctx->frame_size,
 419                                                   s->channels, 16);
 420
 421     /* initialize MD5 context */
 422     s->md5ctx = av_malloc(av_md5_size);
 423     if (!s->md5ctx)
 424         return AVERROR(ENOMEM);
 425     av_md5_init(s->md5ctx);
 426
 427     streaminfo = av_malloc(FLAC_STREAMINFO_SIZE);
 428     if (!streaminfo)
 429         return AVERROR(ENOMEM);
 430     write_streaminfo(s, streaminfo);
 431     avctx->extradata = streaminfo;
 432     avctx->extradata_size = FLAC_STREAMINFO_SIZE;
 433
 434     s->frame_count   = 0;
 435     s->min_framesize = s->max_framesize;
 436
 437     avctx->coded_frame = avcodec_alloc_frame();
 438     if (!avctx->coded_frame)
 439         return AVERROR(ENOMEM);
 440
 441     dprint_compression_options(s);
 442
 443     return 0;
 444 }
 445
 446
 447 static void init_frame(FlacEncodeContext *s)
 448 {
 449     int i, ch;
 450     FlacFrame *frame;
 451
 452     frame = &s->frame;
 453
 454     for (i = 0; i < 16; i++) {
 455         if (s->avctx->frame_size == ff_flac_blocksize_table[i]) {
 456             frame->blocksize  = ff_flac_blocksize_table[i];
 457             frame->bs_code[0] = i;
 458             frame->bs_code[1] = 0;
 459             break;
 460         }
 461     }
 462     if (i == 16) {
 463         frame->blocksize = s->avctx->frame_size;
 464         if (frame->blocksize <= 256) {
 465             frame->bs_code[0] = 6;
 466             frame->bs_code[1] = frame->blocksize-1;
 467         } else {
 468             frame->bs_code[0] = 7;
 469             frame->bs_code[1] = frame->blocksize-1;
 470         }
 471     }
 472
 473     for (ch = 0; ch < s->channels; ch++)
 474         frame->subframes[ch].obits = 16;
 475 }
 476
 477
 478 /**
 479  * Copy channel-interleaved input samples into separate subframes.
 480  */
 481 static void copy_samples(FlacEncodeContext *s, const int16_t *samples)
 482 {
 483     int i, j, ch;
 484     FlacFrame *frame;
 485
 486     frame = &s->frame;
 487     for (i = 0, j = 0; i < frame->blocksize; i++)
 488         for (ch = 0; ch < s->channels; ch++, j++)
 489             frame->subframes[ch].samples[i] = samples[j];
 490 }
 491
 492
 493 #define rice_encode_count(sum, n, k) (((n)*((k)+1))+((sum-(n>>1))>>(k)))
 494
 495 /**
 496  * Solve for d/dk(rice_encode_count) = n-((sum-(n>>1))>>(k+1)) = 0.
 497  */
 498 static int find_optimal_param(uint32_t sum, int n)
 499 {
 500     int k;
 501     uint32_t sum2;
 502
 503     if (sum <= n >> 1)
 504         return 0;
 505     sum2 = sum - (n >> 1);
 506     k    = av_log2(n < 256 ? FASTDIV(sum2, n) : sum2 / n);
 507     return FFMIN(k, MAX_RICE_PARAM);
 508 }
 509
 510
 511 static uint32_t calc_optimal_rice_params(RiceContext *rc, int porder,
 512                                          uint32_t *sums, int n, int pred_order)
 513 {
 514     int i;
 515     int k, cnt, part;
 516     uint32_t all_bits;
 517
 518     part     = (1 << porder);
 519     all_bits = 4 * part;
 520
 521     cnt = (n >> porder) - pred_order;
 522     for (i = 0; i < part; i++) {
 523         k = find_optimal_param(sums[i], cnt);
 524         rc->params[i] = k;
 525         all_bits += rice_encode_count(sums[i], cnt, k);
 526         cnt = n >> porder;
 527     }
 528
 529     rc->porder = porder;
 530
 531     return all_bits;
 532 }
 533
 534
 535 static void calc_sums(int pmin, int pmax, uint32_t *data, int n, int pred_order,
 536                       uint32_t sums[][MAX_PARTITIONS])
 537 {
 538     int i, j;
 539     int parts;
 540     uint32_t *res, *res_end;
 541
 542     /* sums for highest level */
 543     parts   = (1 << pmax);
 544     res     = &data[pred_order];
 545     res_end = &data[n >> pmax];
 546     for (i = 0; i < parts; i++) {
 547         uint32_t sum = 0;
 548         while (res < res_end)
 549             sum += *(res++);
 550         sums[pmax][i] = sum;
 551         res_end += n >> pmax;
 552     }
 553     /* sums for lower levels */
 554     for (i = pmax - 1; i >= pmin; i--) {
 555         parts = (1 << i);
 556         for (j = 0; j < parts; j++)
 557             sums[i][j] = sums[i+1][2*j] + sums[i+1][2*j+1];
 558     }
 559 }
 560
 561
 562 static uint32_t calc_rice_params(RiceContext *rc, int pmin, int pmax,
 563                                  int32_t *data, int n, int pred_order)
 564 {
 565     int i;
 566     uint32_t bits[MAX_PARTITION_ORDER+1];
 567     int opt_porder;
 568     RiceContext tmp_rc;
 569     uint32_t *udata;
 570     uint32_t sums[MAX_PARTITION_ORDER+1][MAX_PARTITIONS];
 571
 572     assert(pmin >= 0 && pmin <= MAX_PARTITION_ORDER);
 573     assert(pmax >= 0 && pmax <= MAX_PARTITION_ORDER);
 574     assert(pmin <= pmax);
 575
 576     udata = av_malloc(n * sizeof(uint32_t));
 577     for (i = 0; i < n; i++)
 578         udata[i] = (2*data[i]) ^ (data[i]>>31);
 579
 580     calc_sums(pmin, pmax, udata, n, pred_order, sums);
 581
 582     opt_porder = pmin;
 583     bits[pmin] = UINT32_MAX;
 584     for (i = pmin; i <= pmax; i++) {
 585         bits[i] = calc_optimal_rice_params(&tmp_rc, i, sums[i], n, pred_order);
 586         if (bits[i] <= bits[opt_porder]) {
 587             opt_porder = i;
 588             *rc = tmp_rc;
 589         }
 590     }
 591
 592     av_freep(&udata);
 593     return bits[opt_porder];
 594 }
 595
 596
 597 static int get_max_p_order(int max_porder, int n, int order)
 598 {
 599     int porder = FFMIN(max_porder, av_log2(n^(n-1)));
 600     if (order > 0)
 601         porder = FFMIN(porder, av_log2(n/order));
 602     return porder;
 603 }
 604
 605
 606 static uint32_t calc_rice_params_fixed(RiceContext *rc, int pmin, int pmax,
 607                                        int32_t *data, int n, int pred_order,
 608                                        int bps)
 609 {
 610     uint32_t bits;
 611     pmin  = get_max_p_order(pmin, n, pred_order);
 612     pmax  = get_max_p_order(pmax, n, pred_order);
 613     bits  = pred_order * bps + 6;
 614     bits += calc_rice_params(rc, pmin, pmax, data, n, pred_order);
 615     return bits;
 616 }
 617
 618
 619 static uint32_t calc_rice_params_lpc(RiceContext *rc, int pmin, int pmax,
 620                                      int32_t *data, int n, int pred_order,
 621                                      int bps, int precision)
 622 {
 623     uint32_t bits;
 624     pmin  = get_max_p_order(pmin, n, pred_order);
 625     pmax  = get_max_p_order(pmax, n, pred_order);
 626     bits  = pred_order*bps + 4 + 5 + pred_order*precision + 6;
 627     bits += calc_rice_params(rc, pmin, pmax, data, n, pred_order);
 628     return bits;
 629 }
 630
 631
 632 static void encode_residual_verbatim(int32_t *res, int32_t *smp, int n)
 633 {
 634     assert(n > 0);
 635     memcpy(res, smp, n * sizeof(int32_t));
 636 }
 637
 638
 639 static void encode_residual_fixed(int32_t *res, const int32_t *smp, int n,
 640                                   int order)
 641 {
 642     int i;
 643
 644     for (i = 0; i < order; i++)
 645         res[i] = smp[i];
 646
 647     if (order == 0) {
 648         for (i = order; i < n; i++)
 649             res[i] = smp[i];
 650     } else if (order == 1) {
 651         for (i = order; i < n; i++)
 652             res[i] = smp[i] - smp[i-1];
 653     } else if (order == 2) {
 654         int a = smp[order-1] - smp[order-2];
 655         for (i = order; i < n; i += 2) {
 656             int b    = smp[i  ] - smp[i-1];
 657             res[i]   = b - a;
 658             a        = smp[i+1] - smp[i  ];
 659             res[i+1] = a - b;
 660         }
 661     } else if (order == 3) {
 662         int a = smp[order-1] -   smp[order-2];
 663         int c = smp[order-1] - 2*smp[order-2] + smp[order-3];
 664         for (i = order; i < n; i += 2) {
 665             int b    = smp[i  ] - smp[i-1];
 666             int d    = b - a;
 667             res[i]   = d - c;
 668             a        = smp[i+1] - smp[i  ];
 669             c        = a - b;
 670             res[i+1] = c - d;
 671         }
 672     } else {
 673         int a = smp[order-1] -   smp[order-2];
 674         int c = smp[order-1] - 2*smp[order-2] +   smp[order-3];
 675         int e = smp[order-1] - 3*smp[order-2] + 3*smp[order-3] - smp[order-4];
 676         for (i = order; i < n; i += 2) {
 677             int b    = smp[i  ] - smp[i-1];
 678             int d    = b - a;
 679             int f    = d - c;
 680             res[i  ] = f - e;
 681             a        = smp[i+1] - smp[i  ];
 682             c        = a - b;
 683             e        = c - d;
 684             res[i+1] = e - f;
 685         }
 686     }
 687 }
 688
 689
 690 #define LPC1(x) {\
 691     int c = coefs[(x)-1];\
 692     p0   += c * s;\
 693     s     = smp[i-(x)+1];\
 694     p1   += c * s;\
 695 }
 696
 697 static av_always_inline void encode_residual_lpc_unrolled(int32_t *res,
 698                                     const int32_t *smp, int n, int order,
 699                                     const int32_t *coefs, int shift, int big)
 700 {
 701     int i;
 702     for (i = order; i < n; i += 2) {
 703         int s  = smp[i-order];
 704         int p0 = 0, p1 = 0;
 705         if (big) {
 706             switch (order) {
 707             case 32: LPC1(32)
 708             case 31: LPC1(31)
 709             case 30: LPC1(30)
 710             case 29: LPC1(29)
 711             case 28: LPC1(28)
 712             case 27: LPC1(27)
 713             case 26: LPC1(26)
 714             case 25: LPC1(25)
 715             case 24: LPC1(24)
 716             case 23: LPC1(23)
 717             case 22: LPC1(22)
 718             case 21: LPC1(21)
 719             case 20: LPC1(20)
 720             case 19: LPC1(19)
 721             case 18: LPC1(18)
 722             case 17: LPC1(17)
 723             case 16: LPC1(16)
 724             case 15: LPC1(15)
 725             case 14: LPC1(14)
 726             case 13: LPC1(13)
 727             case 12: LPC1(12)
 728             case 11: LPC1(11)
 729             case 10: LPC1(10)
 730             case  9: LPC1( 9)
 731                      LPC1( 8)
 732                      LPC1( 7)
 733                      LPC1( 6)
 734                      LPC1( 5)
 735                      LPC1( 4)
 736                      LPC1( 3)
 737                      LPC1( 2)
 738                      LPC1( 1)
 739             }
 740         } else {
 741             switch (order) {
 742             case  8: LPC1( 8)
 743             case  7: LPC1( 7)
 744             case  6: LPC1( 6)
 745             case  5: LPC1( 5)
 746             case  4: LPC1( 4)
 747             case  3: LPC1( 3)
 748             case  2: LPC1( 2)
 749             case  1: LPC1( 1)
 750             }
 751         }
 752         res[i  ] = smp[i  ] - (p0 >> shift);
 753         res[i+1] = smp[i+1] - (p1 >> shift);
 754     }
 755 }
 756
 757
 758 static void encode_residual_lpc(int32_t *res, const int32_t *smp, int n,
 759                                 int order, const int32_t *coefs, int shift)
 760 {
 761     int i;
 762     for (i = 0; i < order; i++)
 763         res[i] = smp[i];
 764 #if CONFIG_SMALL
 765     for (i = order; i < n; i += 2) {
 766         int j;
 767         int s  = smp[i];
 768         int p0 = 0, p1 = 0;
 769         for (j = 0; j < order; j++) {
 770             int c = coefs[j];
 771             p1   += c * s;
 772             s     = smp[i-j-1];
 773             p0   += c * s;
 774         }
 775         res[i  ] = smp[i  ] - (p0 >> shift);
 776         res[i+1] = smp[i+1] - (p1 >> shift);
 777     }
 778 #else
 779     switch (order) {
 780     case  1: encode_residual_lpc_unrolled(res, smp, n, 1, coefs, shift, 0); break;
 781     case  2: encode_residual_lpc_unrolled(res, smp, n, 2, coefs, shift, 0); break;
 782     case  3: encode_residual_lpc_unrolled(res, smp, n, 3, coefs, shift, 0); break;
 783     case  4: encode_residual_lpc_unrolled(res, smp, n, 4, coefs, shift, 0); break;
 784     case  5: encode_residual_lpc_unrolled(res, smp, n, 5, coefs, shift, 0); break;
 785     case  6: encode_residual_lpc_unrolled(res, smp, n, 6, coefs, shift, 0); break;
 786     case  7: encode_residual_lpc_unrolled(res, smp, n, 7, coefs, shift, 0); break;
 787     case  8: encode_residual_lpc_unrolled(res, smp, n, 8, coefs, shift, 0); break;
 788     default: encode_residual_lpc_unrolled(res, smp, n, order, coefs, shift, 1); break;
 789     }
 790 #endif
 791 }
 792
 793
 794 static int encode_residual(FlacEncodeContext *ctx, int ch)
 795 {
 796     int i, n;
 797     int min_order, max_order, opt_order, precision, omethod;
 798     int min_porder, max_porder;
 799     FlacFrame *frame;
 800     FlacSubframe *sub;
 801     int32_t coefs[MAX_LPC_ORDER][MAX_LPC_ORDER];
 802     int shift[MAX_LPC_ORDER];
 803     int32_t *res, *smp;
 804
 805     frame = &ctx->frame;
 806     sub   = &frame->subframes[ch];
 807     res   = sub->residual;
 808     smp   = sub->samples;
 809     n     = frame->blocksize;
 810
 811     /* CONSTANT */
 812     for (i = 1; i < n; i++)
 813         if(smp[i] != smp[0])
 814             break;
 815     if (i == n) {
 816         sub->type = sub->type_code = FLAC_SUBFRAME_CONSTANT;
 817         res[0] = smp[0];
 818         return sub->obits;
 819     }
 820
 821     /* VERBATIM */
 822     if (n < 5) {
 823         sub->type = sub->type_code = FLAC_SUBFRAME_VERBATIM;
 824         encode_residual_verbatim(res, smp, n);
 825         return sub->obits * n;
 826     }
 827
 828     min_order  = ctx->options.min_prediction_order;
 829     max_order  = ctx->options.max_prediction_order;
 830     min_porder = ctx->options.min_partition_order;
 831     max_porder = ctx->options.max_partition_order;
 832     precision  = ctx->options.lpc_coeff_precision;
 833     omethod    = ctx->options.prediction_order_method;
 834
 835     /* FIXED */
 836     if (ctx->options.lpc_type == AV_LPC_TYPE_NONE  ||
 837         ctx->options.lpc_type == AV_LPC_TYPE_FIXED || n <= max_order) {
 838         uint32_t bits[MAX_FIXED_ORDER+1];
 839         if (max_order > MAX_FIXED_ORDER)
 840             max_order = MAX_FIXED_ORDER;
 841         opt_order = 0;
 842         bits[0]   = UINT32_MAX;
 843         for (i = min_order; i <= max_order; i++) {
 844             encode_residual_fixed(res, smp, n, i);
 845             bits[i] = calc_rice_params_fixed(&sub->rc, min_porder, max_porder, res,
 846                                              n, i, sub->obits);
 847             if (bits[i] < bits[opt_order])
 848                 opt_order = i;
 849         }
 850         sub->order     = opt_order;
 851         sub->type      = FLAC_SUBFRAME_FIXED;
 852         sub->type_code = sub->type | sub->order;
 853         if (sub->order != max_order) {
 854             encode_residual_fixed(res, smp, n, sub->order);
 855             return calc_rice_params_fixed(&sub->rc, min_porder, max_porder, res, n,
 856                                           sub->order, sub->obits);
 857         }
 858         return bits[sub->order];
 859     }
 860
 861     /* LPC */
 862     opt_order = ff_lpc_calc_coefs(&ctx->dsp, smp, n, min_order, max_order,
 863                                   precision, coefs, shift, ctx->options.lpc_type,
 864                                   ctx->options.lpc_passes, omethod,
 865                                   MAX_LPC_SHIFT, 0);
 866
 867     if (omethod == ORDER_METHOD_2LEVEL ||
 868         omethod == ORDER_METHOD_4LEVEL ||
 869         omethod == ORDER_METHOD_8LEVEL) {
 870         int levels = 1 << omethod;
 871         uint32_t bits[1 << ORDER_METHOD_8LEVEL];
 872         int order;
 873         int opt_index   = levels-1;
 874         opt_order       = max_order-1;
 875         bits[opt_index] = UINT32_MAX;
 876         for (i = levels-1; i >= 0; i--) {
 877             order = min_order + (((max_order-min_order+1) * (i+1)) / levels)-1;
 878             if (order < 0)
 879                 order = 0;
 880             encode_residual_lpc(res, smp, n, order+1, coefs[order], shift[order]);
 881             bits[i] = calc_rice_params_lpc(&sub->rc, min_porder, max_porder,
 882                                            res, n, order+1, sub->obits, precision);
 883             if (bits[i] < bits[opt_index]) {
 884                 opt_index = i;
 885                 opt_order = order;
 886             }
 887         }
 888         opt_order++;
 889     } else if (omethod == ORDER_METHOD_SEARCH) {
 890         // brute-force optimal order search
 891         uint32_t bits[MAX_LPC_ORDER];
 892         opt_order = 0;
 893         bits[0]   = UINT32_MAX;
 894         for (i = min_order-1; i < max_order; i++) {
 895             encode_residual_lpc(res, smp, n, i+1, coefs[i], shift[i]);
 896             bits[i] = calc_rice_params_lpc(&sub->rc, min_porder, max_porder,
 897                                            res, n, i+1, sub->obits, precision);
 898             if (bits[i] < bits[opt_order])
 899                 opt_order = i;
 900         }
 901         opt_order++;
 902     } else if (omethod == ORDER_METHOD_LOG) {
 903         uint32_t bits[MAX_LPC_ORDER];
 904         int step;
 905
 906         opt_order = min_order - 1 + (max_order-min_order)/3;
 907         memset(bits, -1, sizeof(bits));
 908
 909         for (step = 16; step; step >>= 1) {
 910             int last = opt_order;
 911             for (i = last-step; i <= last+step; i += step) {
 912                 if (i < min_order-1 || i >= max_order || bits[i] < UINT32_MAX)
 913                     continue;
 914                 encode_residual_lpc(res, smp, n, i+1, coefs[i], shift[i]);
 915                 bits[i] = calc_rice_params_lpc(&sub->rc, min_porder, max_porder,
 916                                                res, n, i+1, sub->obits,
 917                                                precision);
 918                 if (bits[i] < bits[opt_order])
 919                     opt_order = i;
 920             }
 921         }
 922         opt_order++;
 923     }
 924
 925     sub->order     = opt_order;
 926     sub->type      = FLAC_SUBFRAME_LPC;
 927     sub->type_code = sub->type | (sub->order-1);
 928     sub->shift     = shift[sub->order-1];
 929     for (i = 0; i < sub->order; i++)
 930         sub->coefs[i] = coefs[sub->order-1][i];
 931
 932     encode_residual_lpc(res, smp, n, sub->order, sub->coefs, sub->shift);
 933
 934     return calc_rice_params_lpc(&sub->rc, min_porder, max_porder, res, n,
 935                                 sub->order, sub->obits, precision);
 936 }
 937
 938
 939 static int encode_residual_v(FlacEncodeContext *ctx, int ch)
 940 {
 941     int i, n;
 942     FlacFrame *frame;
 943     FlacSubframe *sub;
 944     int32_t *res, *smp;
 945
 946     frame = &ctx->frame;
 947     sub   = &frame->subframes[ch];
 948     res   = sub->residual;
 949     smp   = sub->samples;
 950     n     = frame->blocksize;
 951
 952     /* CONSTANT */
 953     for (i = 1; i < n; i++)
 954         if (smp[i] != smp[0])
 955             break;
 956     if (i == n) {
 957         sub->type = sub->type_code = FLAC_SUBFRAME_CONSTANT;
 958         res[0]    = smp[0];
 959         return sub->obits;
 960     }
 961
 962     /* VERBATIM */
 963     sub->type = sub->type_code = FLAC_SUBFRAME_VERBATIM;
 964     encode_residual_verbatim(res, smp, n);
 965     return sub->obits * n;
 966 }
 967
 968
 969 static int estimate_stereo_mode(int32_t *left_ch, int32_t *right_ch, int n)
 970 {
 971     int i, best;
 972     int32_t lt, rt;
 973     uint64_t sum[4];
 974     uint64_t score[4];
 975     int k;
 976
 977     /* calculate sum of 2nd order residual for each channel */
 978     sum[0] = sum[1] = sum[2] = sum[3] = 0;
 979     for (i = 2; i < n; i++) {
 980         lt = left_ch[i]  - 2*left_ch[i-1]  + left_ch[i-2];
 981         rt = right_ch[i] - 2*right_ch[i-1] + right_ch[i-2];
 982         sum[2] += FFABS((lt + rt) >> 1);
 983         sum[3] += FFABS(lt - rt);
 984         sum[0] += FFABS(lt);
 985         sum[1] += FFABS(rt);
 986     }
 987     /* estimate bit counts */
 988     for (i = 0; i < 4; i++) {
 989         k      = find_optimal_param(2 * sum[i], n);
 990         sum[i] = rice_encode_count( 2 * sum[i], n, k);
 991     }
 992
 993     /* calculate score for each mode */
 994     score[0] = sum[0] + sum[1];
 995     score[1] = sum[0] + sum[3];
 996     score[2] = sum[1] + sum[3];
 997     score[3] = sum[2] + sum[3];
 998
 999     /* return mode with lowest score */
1000     best = 0;
1001     for (i = 1; i < 4; i++)
1002         if (score[i] < score[best])
1003             best = i;
1004     if (best == 0) {
1005         return FLAC_CHMODE_INDEPENDENT;
1006     } else if (best == 1) {
1007         return FLAC_CHMODE_LEFT_SIDE;
1008     } else if (best == 2) {
1009         return FLAC_CHMODE_RIGHT_SIDE;
1010     } else {
1011         return FLAC_CHMODE_MID_SIDE;
1012     }
1013 }
1014
1015
1016 /**
1017  * Perform stereo channel decorrelation.
1018  */
1019 static void channel_decorrelation(FlacEncodeContext *ctx)
1020 {
1021     FlacFrame *frame;
1022     int32_t *left, *right;
1023     int i, n;
1024
1025     frame = &ctx->frame;
1026     n     = frame->blocksize;
1027     left  = frame->subframes[0].samples;
1028     right = frame->subframes[1].samples;
1029
1030     if (ctx->channels != 2) {
1031         frame->ch_mode = FLAC_CHMODE_INDEPENDENT;
1032         return;
1033     }
1034
1035     frame->ch_mode = estimate_stereo_mode(left, right, n);
1036
1037     /* perform decorrelation and adjust bits-per-sample */
1038     if (frame->ch_mode == FLAC_CHMODE_INDEPENDENT)
1039         return;
1040     if (frame->ch_mode == FLAC_CHMODE_MID_SIDE) {
1041         int32_t tmp;
1042         for (i = 0; i < n; i++) {
1043             tmp      = left[i];
1044             left[i]  = (tmp + right[i]) >> 1;
1045             right[i] =  tmp - right[i];
1046         }
1047         frame->subframes[1].obits++;
1048     } else if (frame->ch_mode == FLAC_CHMODE_LEFT_SIDE) {
1049         for (i = 0; i < n; i++)
1050             right[i] = left[i] - right[i];
1051         frame->subframes[1].obits++;
1052     } else {
1053         for (i = 0; i < n; i++)
1054             left[i] -= right[i];
1055         frame->subframes[0].obits++;
1056     }
1057 }
1058
1059
1060 static void write_utf8(PutBitContext *pb, uint32_t val)
1061 {
1062     uint8_t tmp;
1063     PUT_UTF8(val, tmp, put_bits(pb, 8, tmp);)
1064 }
1065
1066
1067 static void output_frame_header(FlacEncodeContext *s)
1068 {
1069     FlacFrame *frame;
1070     int crc;
1071
1072     frame = &s->frame;
1073
1074     put_bits(&s->pb, 16, 0xFFF8);
1075     put_bits(&s->pb, 4, frame->bs_code[0]);
1076     put_bits(&s->pb, 4, s->sr_code[0]);
1077
1078     if (frame->ch_mode == FLAC_CHMODE_INDEPENDENT)
1079         put_bits(&s->pb, 4, s->channels-1);
1080     else
1081         put_bits(&s->pb, 4, frame->ch_mode);
1082
1083     put_bits(&s->pb, 3, 4); /* bits-per-sample code */
1084     put_bits(&s->pb, 1, 0);
1085     write_utf8(&s->pb, s->frame_count);
1086
1087     if (frame->bs_code[0] == 6)
1088         put_bits(&s->pb, 8, frame->bs_code[1]);
1089     else if (frame->bs_code[0] == 7)
1090         put_bits(&s->pb, 16, frame->bs_code[1]);
1091
1092     if (s->sr_code[0] == 12)
1093         put_bits(&s->pb, 8, s->sr_code[1]);
1094     else if (s->sr_code[0] > 12)
1095         put_bits(&s->pb, 16, s->sr_code[1]);
1096
1097     flush_put_bits(&s->pb);
1098     crc = av_crc(av_crc_get_table(AV_CRC_8_ATM), 0, s->pb.buf,
1099                  put_bits_count(&s->pb) >> 3);
1100     put_bits(&s->pb, 8, crc);
1101 }
1102
1103
1104 static void output_subframe_constant(FlacEncodeContext *s, int ch)
1105 {
1106     FlacSubframe *sub;
1107     int32_t res;
1108
1109     sub = &s->frame.subframes[ch];
1110     res = sub->residual[0];
1111     put_sbits(&s->pb, sub->obits, res);
1112 }
1113
1114
1115 static void output_subframe_verbatim(FlacEncodeContext *s, int ch)
1116 {
1117     int i;
1118     FlacFrame *frame;
1119     FlacSubframe *sub;
1120     int32_t res;
1121
1122     frame = &s->frame;
1123     sub   = &frame->subframes[ch];
1124
1125     for (i = 0; i < frame->blocksize; i++) {
1126         res = sub->residual[i];
1127         put_sbits(&s->pb, sub->obits, res);
1128     }
1129 }
1130
1131
1132 static void output_residual(FlacEncodeContext *ctx, int ch)
1133 {
1134     int i, j, p, n, parts;
1135     int k, porder, psize, res_cnt;
1136     FlacFrame *frame;
1137     FlacSubframe *sub;
1138     int32_t *res;
1139
1140     frame = &ctx->frame;
1141     sub   = &frame->subframes[ch];
1142     res   = sub->residual;
1143     n     = frame->blocksize;
1144
1145     /* rice-encoded block */
1146     put_bits(&ctx->pb, 2, 0);
1147
1148     /* partition order */
1149     porder  = sub->rc.porder;
1150     psize   = n >> porder;
1151     parts   = (1 << porder);
1152     put_bits(&ctx->pb, 4, porder);
1153     res_cnt = psize - sub->order;
1154
1155     /* residual */
1156     j = sub->order;
1157     for (p = 0; p < parts; p++) {
1158         k = sub->rc.params[p];
1159         put_bits(&ctx->pb, 4, k);
1160         if (p == 1)
1161             res_cnt = psize;
1162         for (i = 0; i < res_cnt && j < n; i++, j++)
1163             set_sr_golomb_flac(&ctx->pb, res[j], k, INT32_MAX, 0);
1164     }
1165 }
1166
1167
1168 static void output_subframe_fixed(FlacEncodeContext *ctx, int ch)
1169 {
1170     int i;
1171     FlacFrame *frame;
1172     FlacSubframe *sub;
1173
1174     frame = &ctx->frame;
1175     sub   = &frame->subframes[ch];
1176
1177     /* warm-up samples */
1178     for (i = 0; i < sub->order; i++)
1179         put_sbits(&ctx->pb, sub->obits, sub->residual[i]);
1180
1181     /* residual */
1182     output_residual(ctx, ch);
1183 }
1184
1185
1186 static void output_subframe_lpc(FlacEncodeContext *ctx, int ch)
1187 {
1188     int i, cbits;
1189     FlacFrame *frame;
1190     FlacSubframe *sub;
1191
1192     frame = &ctx->frame;
1193     sub = &frame->subframes[ch];
1194
1195     /* warm-up samples */
1196     for (i = 0; i < sub->order; i++)
1197         put_sbits(&ctx->pb, sub->obits, sub->residual[i]);
1198
1199     /* LPC coefficients */
1200     cbits = ctx->options.lpc_coeff_precision;
1201     put_bits( &ctx->pb, 4, cbits-1);
1202     put_sbits(&ctx->pb, 5, sub->shift);
1203     for (i = 0; i < sub->order; i++)
1204         put_sbits(&ctx->pb, cbits, sub->coefs[i]);
1205
1206     /* residual */
1207     output_residual(ctx, ch);
1208 }
1209
1210
1211 static void output_subframes(FlacEncodeContext *s)
1212 {
1213     FlacFrame *frame;
1214     FlacSubframe *sub;
1215     int ch;
1216
1217     frame = &s->frame;
1218
1219     for (ch = 0; ch < s->channels; ch++) {
1220         sub = &frame->subframes[ch];
1221
1222         /* subframe header */
1223         put_bits(&s->pb, 1, 0);
1224         put_bits(&s->pb, 6, sub->type_code);
1225         put_bits(&s->pb, 1, 0); /* no wasted bits */
1226
1227         /* subframe */
1228         if(sub->type == FLAC_SUBFRAME_CONSTANT)
1229             output_subframe_constant(s, ch);
1230         else if(sub->type == FLAC_SUBFRAME_VERBATIM)
1231             output_subframe_verbatim(s, ch);
1232         else if(sub->type == FLAC_SUBFRAME_FIXED)
1233             output_subframe_fixed(s, ch);
1234         else if(sub->type == FLAC_SUBFRAME_LPC)
1235             output_subframe_lpc(s, ch);
1236     }
1237 }
1238
1239
1240 static void output_frame_footer(FlacEncodeContext *s)
1241 {
1242     int crc;
1243     flush_put_bits(&s->pb);
1244     crc = av_bswap16(av_crc(av_crc_get_table(AV_CRC_16_ANSI), 0, s->pb.buf,
1245                             put_bits_count(&s->pb)>>3));
1246     put_bits(&s->pb, 16, crc);
1247     flush_put_bits(&s->pb);
1248 }
1249
1250
1251 static void update_md5_sum(FlacEncodeContext *s, const int16_t *samples)
1252 {
1253 #if HAVE_BIGENDIAN
1254     int i;
1255     for (i = 0; i < s->frame.blocksize * s->channels; i++) {
1256         int16_t smp = av_le2ne16(samples[i]);
1257         av_md5_update(s->md5ctx, (uint8_t *)&smp, 2);
1258     }
1259 #else
1260     av_md5_update(s->md5ctx, (const uint8_t *)samples, s->frame.blocksize*s->channels*2);
1261 #endif
1262 }
1263
1264
1265 static int flac_encode_frame(AVCodecContext *avctx, uint8_t *frame,
1266                              int buf_size, void *data)
1267 {
1268     int ch;
1269     FlacEncodeContext *s;
1270     const int16_t *samples = data;
1271     int out_bytes;
1272     int reencoded=0;
1273
1274     s = avctx->priv_data;
1275
1276     if (buf_size < s->max_framesize * 2) {
1277         av_log(avctx, AV_LOG_ERROR, "output buffer too small\n");
1278         return 0;
1279     }
1280
1281     /* when the last block is reached, update the header in extradata */
1282     if (!data) {
1283         s->max_framesize = s->max_encoded_framesize;
1284         av_md5_final(s->md5ctx, s->md5sum);
1285         write_streaminfo(s, avctx->extradata);
1286         return 0;
1287     }
1288
1289     init_frame(s);
1290
1291     copy_samples(s, samples);
1292
1293     channel_decorrelation(s);
1294
1295     for (ch = 0; ch < s->channels; ch++)
1296         encode_residual(s, ch);
1297
1298 write_frame:
1299     init_put_bits(&s->pb, frame, buf_size);
1300     output_frame_header(s);
1301     output_subframes(s);
1302     output_frame_footer(s);
1303     out_bytes = put_bits_count(&s->pb) >> 3;
1304
1305     if (out_bytes > s->max_framesize) {
1306         if (reencoded) {
1307             /* still too large. must be an error. */
1308             av_log(avctx, AV_LOG_ERROR, "error encoding frame\n");
1309             return -1;
1310         }
1311
1312         /* frame too large. use verbatim mode */
1313         for (ch = 0; ch < s->channels; ch++)
1314             encode_residual_v(s, ch);
1315         reencoded = 1;
1316         goto write_frame;
1317     }
1318
1319     s->frame_count++;
1320     s->sample_count += avctx->frame_size;
1321     update_md5_sum(s, samples);
1322     if (out_bytes > s->max_encoded_framesize)
1323         s->max_encoded_framesize = out_bytes;
1324     if (out_bytes < s->min_framesize)
1325         s->min_framesize = out_bytes;
1326
1327     return out_bytes;
1328 }
1329
1330
1331 static av_cold int flac_encode_close(AVCodecContext *avctx)
1332 {
1333     if (avctx->priv_data) {
1334         FlacEncodeContext *s = avctx->priv_data;
1335         av_freep(&s->md5ctx);
1336     }
1337     av_freep(&avctx->extradata);
1338     avctx->extradata_size = 0;
1339     av_freep(&avctx->coded_frame);
1340     return 0;
1341 }
1342
1343
1344 AVCodec flac_encoder = {
1345     "flac",
1346     AVMEDIA_TYPE_AUDIO,
1347     CODEC_ID_FLAC,
1348     sizeof(FlacEncodeContext),
1349     flac_encode_init,
1350     flac_encode_frame,
1351     flac_encode_close,
1352     NULL,
1353     .capabilities = CODEC_CAP_SMALL_LAST_FRAME | CODEC_CAP_DELAY,
1354     .sample_fmts = (const enum SampleFormat[]){SAMPLE_FMT_S16,SAMPLE_FMT_NONE},
1355     .long_name = NULL_IF_CONFIG_SMALL("FLAC (Free Lossless Audio Codec)"),
1356 };