git.sesse.net Git - ffmpeg/blob - libavcodec/libmp3lame.c

   1 /*
   2  * Interface to libmp3lame for mp3 encoding
   3  * Copyright (c) 2002 Lennert Buytenhek <buytenh@gnu.org>
   4  *
   5  * This file is part of FFmpeg.
   6  *
   7  * FFmpeg is free software; you can redistribute it and/or
   8  * modify it under the terms of the GNU Lesser General Public
   9  * License as published by the Free Software Foundation; either
  10  * version 2.1 of the License, or (at your option) any later version.
  11  *
  12  * FFmpeg is distributed in the hope that it will be useful,
  13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  15  * Lesser General Public License for more details.
  16  *
  17  * You should have received a copy of the GNU Lesser General Public
  18  * License along with FFmpeg; if not, write to the Free Software
  19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  20  */
  21
  22 /**
  23  * @file
  24  * Interface to libmp3lame for mp3 encoding.
  25  */
  26
  27 #include <lame/lame.h>
  28
  29 #include "libavutil/intreadwrite.h"
  30 #include "libavutil/log.h"
  31 #include "libavutil/opt.h"
  32 #include "avcodec.h"
  33 #include "audio_frame_queue.h"
  34 #include "internal.h"
  35 #include "mpegaudio.h"
  36 #include "mpegaudiodecheader.h"
  37
  38 #define BUFFER_SIZE (7200 + 2 * MPA_FRAME_SIZE + MPA_FRAME_SIZE / 4+1000) // FIXME: Buffer size to small? Adding 1000 to make up for it.
  39
  40 typedef struct LAMEContext {
  41     AVClass *class;
  42     AVCodecContext *avctx;
  43     lame_global_flags *gfp;
  44     uint8_t buffer[BUFFER_SIZE];
  45     int buffer_index;
  46     int reservoir;
  47     void *planar_samples[2];
  48     AudioFrameQueue afq;
  49 } LAMEContext;
  50
  51
  52 static av_cold int mp3lame_encode_close(AVCodecContext *avctx)
  53 {
  54     LAMEContext *s = avctx->priv_data;
  55
  56 #if FF_API_OLD_ENCODE_AUDIO
  57     av_freep(&avctx->coded_frame);
  58 #endif
  59     av_freep(&s->planar_samples[0]);
  60     av_freep(&s->planar_samples[1]);
  61
  62     ff_af_queue_close(&s->afq);
  63
  64     lame_close(s->gfp);
  65     return 0;
  66 }
  67
  68 static av_cold int mp3lame_encode_init(AVCodecContext *avctx)
  69 {
  70     LAMEContext *s = avctx->priv_data;
  71     int ret;
  72
  73     s->avctx = avctx;
  74
  75     /* initialize LAME and get defaults */
  76     if ((s->gfp = lame_init()) == NULL)
  77         return AVERROR(ENOMEM);
  78
  79     /* channels */
  80     if (avctx->channels > 2) {
  81         av_log(avctx, AV_LOG_ERROR,
  82                "Invalid number of channels %d, must be <= 2\n", avctx->channels);
  83         ret =  AVERROR(EINVAL);
  84         goto error;
  85     }
  86     lame_set_num_channels(s->gfp, avctx->channels);
  87     lame_set_mode(s->gfp, avctx->channels > 1 ? JOINT_STEREO : MONO);
  88
  89     /* sample rate */
  90     lame_set_in_samplerate (s->gfp, avctx->sample_rate);
  91     lame_set_out_samplerate(s->gfp, avctx->sample_rate);
  92
  93     /* algorithmic quality */
  94     if (avctx->compression_level == FF_COMPRESSION_DEFAULT)
  95         lame_set_quality(s->gfp, 5);
  96     else
  97         lame_set_quality(s->gfp, avctx->compression_level);
  98
  99     /* rate control */
 100     if (avctx->flags & CODEC_FLAG_QSCALE) {
 101         lame_set_VBR(s->gfp, vbr_default);
 102         lame_set_VBR_quality(s->gfp, avctx->global_quality / (float)FF_QP2LAMBDA);
 103     } else {
 104         if (avctx->bit_rate)
 105             lame_set_brate(s->gfp, avctx->bit_rate / 1000);
 106     }
 107
 108     /* do not get a Xing VBR header frame from LAME */
 109     lame_set_bWriteVbrTag(s->gfp,0);
 110
 111     /* bit reservoir usage */
 112     lame_set_disable_reservoir(s->gfp, !s->reservoir);
 113
 114     /* set specified parameters */
 115     if (lame_init_params(s->gfp) < 0) {
 116         ret = -1;
 117         goto error;
 118     }
 119
 120     /* get encoder delay */
 121     avctx->delay = lame_get_encoder_delay(s->gfp) + 528 + 1;
 122     ff_af_queue_init(avctx, &s->afq);
 123
 124     avctx->frame_size  = lame_get_framesize(s->gfp);
 125
 126 #if FF_API_OLD_ENCODE_AUDIO
 127     avctx->coded_frame = avcodec_alloc_frame();
 128     if (!avctx->coded_frame) {
 129         ret = AVERROR(ENOMEM);
 130         goto error;
 131     }
 132 #endif
 133
 134     /* sample format */
 135     if (avctx->sample_fmt == AV_SAMPLE_FMT_S32 ||
 136         avctx->sample_fmt == AV_SAMPLE_FMT_FLT) {
 137         int ch;
 138         for (ch = 0; ch < avctx->channels; ch++) {
 139             s->planar_samples[ch] = av_malloc(avctx->frame_size *
 140                                               av_get_bytes_per_sample(avctx->sample_fmt));
 141             if (!s->planar_samples[ch]) {
 142                 ret = AVERROR(ENOMEM);
 143                 goto error;
 144             }
 145         }
 146     }
 147
 148     return 0;
 149 error:
 150     mp3lame_encode_close(avctx);
 151     return ret;
 152 }
 153
 154 #define DEINTERLEAVE(type, scale) do {                  \
 155     int ch, i;                                          \
 156     for (ch = 0; ch < s->avctx->channels; ch++) {       \
 157         const type *input = samples;                    \
 158         type      *output = s->planar_samples[ch];      \
 159         input += ch;                                    \
 160         for (i = 0; i < nb_samples; i++) {              \
 161             output[i] = *input * scale;                 \
 162             input += s->avctx->channels;                \
 163         }                                               \
 164     }                                                   \
 165 } while (0)
 166
 167 static int encode_frame_int16(LAMEContext *s, void *samples, int nb_samples)
 168 {
 169     if (s->avctx->channels > 1) {
 170         return lame_encode_buffer_interleaved(s->gfp, samples,
 171                                               nb_samples,
 172                                               s->buffer + s->buffer_index,
 173                                               BUFFER_SIZE - s->buffer_index);
 174     } else {
 175         return lame_encode_buffer(s->gfp, samples, NULL, nb_samples,
 176                                   s->buffer + s->buffer_index,
 177                                   BUFFER_SIZE - s->buffer_index);
 178     }
 179 }
 180
 181 static int encode_frame_int32(LAMEContext *s, void *samples, int nb_samples)
 182 {
 183     DEINTERLEAVE(int32_t, 1);
 184
 185     return lame_encode_buffer_int(s->gfp,
 186                                   s->planar_samples[0], s->planar_samples[1],
 187                                   nb_samples,
 188                                   s->buffer + s->buffer_index,
 189                                   BUFFER_SIZE - s->buffer_index);
 190 }
 191
 192 static int encode_frame_float(LAMEContext *s, void *samples, int nb_samples)
 193 {
 194     DEINTERLEAVE(float, 32768.0f);
 195
 196     return lame_encode_buffer_float(s->gfp,
 197                                     s->planar_samples[0], s->planar_samples[1],
 198                                     nb_samples,
 199                                     s->buffer + s->buffer_index,
 200                                     BUFFER_SIZE - s->buffer_index);
 201 }
 202
 203 static int mp3lame_encode_frame(AVCodecContext *avctx, AVPacket *avpkt,
 204                                 const AVFrame *frame, int *got_packet_ptr)
 205 {
 206     LAMEContext *s = avctx->priv_data;
 207     MPADecodeHeader hdr;
 208     int len, ret;
 209     int lame_result;
 210
 211     if (frame) {
 212         switch (avctx->sample_fmt) {
 213         case AV_SAMPLE_FMT_S16:
 214             lame_result = encode_frame_int16(s, frame->data[0], frame->nb_samples);
 215             break;
 216         case AV_SAMPLE_FMT_S32:
 217             lame_result = encode_frame_int32(s, frame->data[0], frame->nb_samples);
 218             break;
 219         case AV_SAMPLE_FMT_FLT:
 220             lame_result = encode_frame_float(s, frame->data[0], frame->nb_samples);
 221             break;
 222         default:
 223             return AVERROR_BUG;
 224         }
 225     } else {
 226         lame_result = lame_encode_flush(s->gfp, s->buffer + s->buffer_index,
 227                                         BUFFER_SIZE - s->buffer_index);
 228     }
 229     if (lame_result < 0) {
 230         if (lame_result == -1) {
 231             av_log(avctx, AV_LOG_ERROR,
 232                    "lame: output buffer too small (buffer index: %d, free bytes: %d)\n",
 233                    s->buffer_index, BUFFER_SIZE - s->buffer_index);
 234         }
 235         return -1;
 236     }
 237     s->buffer_index += lame_result;
 238
 239     /* add current frame to the queue */
 240     if (frame) {
 241         if ((ret = ff_af_queue_add(&s->afq, frame) < 0))
 242             return ret;
 243     }
 244
 245     /* Move 1 frame from the LAME buffer to the output packet, if available.
 246        We have to parse the first frame header in the output buffer to
 247        determine the frame size. */
 248     if (s->buffer_index < 4)
 249         return 0;
 250     if (avpriv_mpegaudio_decode_header(&hdr, AV_RB32(s->buffer))) {
 251         av_log(avctx, AV_LOG_ERROR, "free format output not supported\n");
 252         return -1;
 253     }
 254     len = hdr.frame_size;
 255     av_dlog(avctx, "in:%d packet-len:%d index:%d\n", avctx->frame_size, len,
 256             s->buffer_index);
 257     if (len <= s->buffer_index) {
 258         if ((ret = ff_alloc_packet2(avctx, avpkt, len))) {
 259             return ret;
 260         }
 261         memcpy(avpkt->data, s->buffer, len);
 262         s->buffer_index -= len;
 263         memmove(s->buffer, s->buffer + len, s->buffer_index);
 264
 265         /* Get the next frame pts/duration */
 266         ff_af_queue_remove(&s->afq, avctx->frame_size, &avpkt->pts,
 267                            &avpkt->duration);
 268
 269         avpkt->size = len;
 270         *got_packet_ptr = 1;
 271     }
 272     return 0;
 273 }
 274
 275 #define OFFSET(x) offsetof(LAMEContext, x)
 276 #define AE AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
 277 static const AVOption options[] = {
 278     { "reservoir", "Use bit reservoir.", OFFSET(reservoir), AV_OPT_TYPE_INT, { 1 }, 0, 1, AE },
 279     { NULL },
 280 };
 281
 282 static const AVClass libmp3lame_class = {
 283     .class_name = "libmp3lame encoder",
 284     .item_name  = av_default_item_name,
 285     .option     = options,
 286     .version    = LIBAVUTIL_VERSION_INT,
 287 };
 288
 289 static const AVCodecDefault libmp3lame_defaults[] = {
 290     { "b",          "0" },
 291     { NULL },
 292 };
 293
 294 static const int libmp3lame_sample_rates[] = {
 295     44100, 48000,  32000, 22050, 24000, 16000, 11025, 12000, 8000, 0
 296 };
 297
 298 AVCodec ff_libmp3lame_encoder = {
 299     .name                  = "libmp3lame",
 300     .type                  = AVMEDIA_TYPE_AUDIO,
 301     .id                    = CODEC_ID_MP3,
 302     .priv_data_size        = sizeof(LAMEContext),
 303     .init                  = mp3lame_encode_init,
 304     .encode2               = mp3lame_encode_frame,
 305     .close                 = mp3lame_encode_close,
 306     .capabilities          = CODEC_CAP_DELAY | CODEC_CAP_SMALL_LAST_FRAME,
 307     .sample_fmts           = (const enum AVSampleFormat[]) { AV_SAMPLE_FMT_S32,
 308                                                              AV_SAMPLE_FMT_FLT,
 309                                                              AV_SAMPLE_FMT_S16,
 310                                                              AV_SAMPLE_FMT_NONE },
 311     .supported_samplerates = libmp3lame_sample_rates,
 312     .long_name             = NULL_IF_CONFIG_SMALL("libmp3lame MP3 (MPEG audio layer 3)"),
 313     .priv_class            = &libmp3lame_class,
 314     .defaults              = libmp3lame_defaults,
 315 };