1 /*****************************************************************************
2 * audio.c: audio decoder using ffmpeg library
3 *****************************************************************************
4 * Copyright (C) 1999-2003 the VideoLAN team
7 * Authors: Laurent Aimar <fenrir@via.ecp.fr>
8 * Gildas Bazin <gbazin@videolan.org>
10 * This program is free software; you can redistribute it and/or modify
11 * it under the terms of the GNU General Public License as published by
12 * the Free Software Foundation; either version 2 of the License, or
13 * (at your option) any later version.
15 * This program is distributed in the hope that it will be useful,
16 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 * GNU General Public License for more details.
20 * You should have received a copy of the GNU General Public License
21 * along with this program; if not, write to the Free Software
22 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston MA 02110-1301, USA.
23 *****************************************************************************/
25 /*****************************************************************************
27 *****************************************************************************/
32 #include <vlc_common.h>
34 #include <vlc_codec.h>
35 #include <vlc_avcodec.h>
38 #ifdef HAVE_LIBAVCODEC_AVCODEC_H
39 # include <libavcodec/avcodec.h>
40 #elif defined(HAVE_FFMPEG_AVCODEC_H)
41 # include <ffmpeg/avcodec.h>
48 /*****************************************************************************
49 * decoder_sys_t : decoder descriptor
50 *****************************************************************************/
55 /* Temporary buffer for libavcodec */
62 audio_sample_format_t aout_format;
63 audio_date_t end_date;
76 int pi_extraction[AOUT_CHAN_MAX];
77 int i_previous_channels;
78 int64_t i_previous_layout;
81 static void SetupOutputFormat( decoder_t *p_dec );
83 /*****************************************************************************
84 * InitAudioDec: initialize audio decoder
85 *****************************************************************************
86 * The ffmpeg codec will be opened, some memory allocated.
87 *****************************************************************************/
88 int InitAudioDec( decoder_t *p_dec, AVCodecContext *p_context,
89 AVCodec *p_codec, int i_codec_id, const char *psz_namecodec )
93 /* Allocate the memory needed to store the decoder's structure */
94 if( ( p_dec->p_sys = p_sys = malloc(sizeof(*p_sys)) ) == NULL )
99 p_sys->p_context = p_context;
100 p_sys->p_codec = p_codec;
101 p_sys->i_codec_id = i_codec_id;
102 p_sys->psz_namecodec = psz_namecodec;
103 p_sys->b_delayed_open = false;
105 /* ***** Fill p_context with init values ***** */
106 p_sys->p_context->sample_rate = p_dec->fmt_in.audio.i_rate;
107 p_sys->p_context->channels = p_dec->fmt_in.audio.i_channels;
109 p_sys->p_context->block_align = p_dec->fmt_in.audio.i_blockalign;
110 p_sys->p_context->bit_rate = p_dec->fmt_in.i_bitrate;
111 #if LIBAVCODEC_VERSION_INT < ((52<<16)+(0<<8)+0)
112 p_sys->p_context->bits_per_sample = p_dec->fmt_in.audio.i_bitspersample;
114 p_sys->p_context->bits_per_coded_sample = p_dec->fmt_in.audio.i_bitspersample;
117 if( p_dec->fmt_in.i_extra > 0 )
119 const uint8_t * const p_src = p_dec->fmt_in.p_extra;
123 if( p_dec->fmt_in.i_codec == VLC_FOURCC( 'f', 'l', 'a', 'c' ) )
126 i_size = p_dec->fmt_in.i_extra - 8;
128 else if( p_dec->fmt_in.i_codec == VLC_FOURCC( 'a', 'l', 'a', 'c' ) )
130 static const uint8_t p_pattern[] = { 0, 0, 0, 36, 'a', 'l', 'a', 'c' };
131 /* Find alac atom XXX it is a bit ugly */
132 for( i_offset = 0; i_offset < p_dec->fmt_in.i_extra - sizeof(p_pattern); i_offset++ )
134 if( !memcmp( &p_src[i_offset], p_pattern, sizeof(p_pattern) ) )
137 i_size = __MIN( p_dec->fmt_in.i_extra - i_offset, 36 );
144 i_size = p_dec->fmt_in.i_extra;
149 p_sys->p_context->extradata =
150 malloc( i_size + FF_INPUT_BUFFER_PADDING_SIZE );
151 if( p_sys->p_context->extradata )
153 uint8_t *p_dst = p_sys->p_context->extradata;
155 p_sys->p_context->extradata_size = i_size;
157 memcpy( &p_dst[0], &p_src[i_offset], i_size );
158 memset( &p_dst[i_size], 0, FF_INPUT_BUFFER_PADDING_SIZE );
164 p_sys->p_context->extradata_size = 0;
165 p_sys->p_context->extradata = NULL;
168 /* ***** Open the codec ***** */
171 ret = avcodec_open( p_sys->p_context, p_sys->p_codec );
172 vlc_avcodec_unlock();
175 msg_Err( p_dec, "cannot open codec (%s)", p_sys->psz_namecodec );
176 free( p_sys->p_context->extradata );
181 msg_Dbg( p_dec, "ffmpeg codec (%s) started", p_sys->psz_namecodec );
185 #if LIBAVCODEC_VERSION_INT >= AV_VERSION_INT( 51, 16, 0 )
186 case CODEC_ID_WAVPACK:
187 p_sys->i_output_max = 8 * sizeof(int32_t) * 131072;
191 p_sys->i_output_max = 8 * sizeof(int32_t) * 65535;
194 p_sys->i_output_max = 0;
197 if( p_sys->i_output_max < AVCODEC_MAX_AUDIO_FRAME_SIZE )
198 p_sys->i_output_max = AVCODEC_MAX_AUDIO_FRAME_SIZE;
199 msg_Dbg( p_dec, "Using %d bytes output buffer", p_sys->i_output_max );
200 p_sys->p_output = malloc( p_sys->i_output_max );
202 p_sys->p_samples = NULL;
203 p_sys->i_samples = 0;
204 p_sys->i_reject_count = 0;
205 p_sys->b_extract = false;
206 p_sys->i_previous_channels = 0;
207 p_sys->i_previous_layout = 0;
209 aout_DateSet( &p_sys->end_date, 0 );
210 if( p_dec->fmt_in.audio.i_rate )
211 aout_DateInit( &p_sys->end_date, p_dec->fmt_in.audio.i_rate );
214 es_format_Init( &p_dec->fmt_out, AUDIO_ES, 0 );
219 /*****************************************************************************
220 * SplitBuffer: Needed because aout really doesn't like big audio chunk and
221 * wma produces easily > 30000 samples...
222 *****************************************************************************/
223 static aout_buffer_t *SplitBuffer( decoder_t *p_dec )
225 decoder_sys_t *p_sys = p_dec->p_sys;
226 int i_samples = __MIN( p_sys->i_samples, 4096 );
227 aout_buffer_t *p_buffer;
229 if( i_samples == 0 ) return NULL;
231 if( ( p_buffer = decoder_NewAudioBuffer( p_dec, i_samples ) ) == NULL )
234 p_buffer->start_date = aout_DateGet( &p_sys->end_date );
235 p_buffer->end_date = aout_DateIncrement( &p_sys->end_date, i_samples );
237 if( p_sys->b_extract )
238 aout_ChannelExtract( p_buffer->p_buffer, p_dec->fmt_out.audio.i_channels,
239 p_sys->p_samples, p_sys->p_context->channels, i_samples,
240 p_sys->pi_extraction, p_dec->fmt_out.audio.i_bitspersample );
242 memcpy( p_buffer->p_buffer, p_sys->p_samples, p_buffer->i_nb_bytes );
244 p_sys->p_samples += p_buffer->i_nb_bytes;
245 p_sys->i_samples -= i_samples;
250 /*****************************************************************************
251 * DecodeAudio: Called to decode one frame
252 *****************************************************************************/
253 aout_buffer_t * DecodeAudio ( decoder_t *p_dec, block_t **pp_block )
255 decoder_sys_t *p_sys = p_dec->p_sys;
256 int i_used, i_output;
257 aout_buffer_t *p_buffer;
260 if( !pp_block || !*pp_block ) return NULL;
264 if( p_block->i_flags & (BLOCK_FLAG_DISCONTINUITY|BLOCK_FLAG_CORRUPTED) )
266 block_Release( p_block );
267 avcodec_flush_buffers( p_sys->p_context );
268 p_sys->i_samples = 0;
269 aout_DateSet( &p_sys->end_date, 0 );
271 if( p_sys->i_codec_id == CODEC_ID_MP2 || p_sys->i_codec_id == CODEC_ID_MP3 )
272 p_sys->i_reject_count = 3;
276 if( p_sys->i_samples > 0 )
279 p_buffer = SplitBuffer( p_dec );
280 if( !p_buffer ) block_Release( p_block );
284 if( !aout_DateGet( &p_sys->end_date ) && !p_block->i_pts )
286 /* We've just started the stream, wait for the first PTS. */
287 block_Release( p_block );
291 if( p_block->i_buffer <= 0 )
293 block_Release( p_block );
297 i_output = __MAX( p_block->i_buffer, p_sys->i_output_max );
298 if( i_output < p_sys->i_output_max )
300 /* Grow output buffer if necessary (eg. for PCM data) */
301 p_sys->p_output = realloc(p_sys->p_output, p_block->i_buffer);
304 *pp_block = p_block = block_Realloc( p_block, 0, p_block->i_buffer + FF_INPUT_BUFFER_PADDING_SIZE );
307 p_block->i_buffer -= FF_INPUT_BUFFER_PADDING_SIZE;
308 memset( &p_block->p_buffer[p_block->i_buffer], 0, FF_INPUT_BUFFER_PADDING_SIZE );
310 #if LIBAVCODEC_VERSION_INT >= ((52<<16)+(0<<8)+0)
311 i_used = avcodec_decode_audio2( p_sys->p_context,
312 (int16_t*)p_sys->p_output, &i_output,
313 p_block->p_buffer, p_block->i_buffer );
315 i_used = avcodec_decode_audio( p_sys->p_context,
316 (int16_t*)p_sys->p_output, &i_output,
317 p_block->p_buffer, p_block->i_buffer );
320 if( i_used < 0 || i_output < 0 )
323 msg_Warn( p_dec, "cannot decode one frame (%zu bytes)",
326 block_Release( p_block );
329 else if( (size_t)i_used > p_block->i_buffer )
331 i_used = p_block->i_buffer;
334 p_block->i_buffer -= i_used;
335 p_block->p_buffer += i_used;
337 if( p_sys->p_context->channels <= 0 || p_sys->p_context->channels > 8 ||
338 p_sys->p_context->sample_rate <= 0 )
340 msg_Warn( p_dec, "invalid audio properties channels count %d, sample rate %d",
341 p_sys->p_context->channels, p_sys->p_context->sample_rate );
342 block_Release( p_block );
346 if( p_dec->fmt_out.audio.i_rate != (unsigned int)p_sys->p_context->sample_rate )
348 aout_DateInit( &p_sys->end_date, p_sys->p_context->sample_rate );
349 aout_DateSet( &p_sys->end_date, p_block->i_pts );
352 /* **** Set audio output parameters **** */
353 SetupOutputFormat( p_dec );
355 if( p_block->i_pts != 0 &&
356 p_block->i_pts != aout_DateGet( &p_sys->end_date ) )
358 aout_DateSet( &p_sys->end_date, p_block->i_pts );
362 /* **** Now we can output these samples **** */
363 p_sys->i_samples = i_output / (p_dec->fmt_out.audio.i_bitspersample / 8) / p_sys->p_context->channels;
364 p_sys->p_samples = p_sys->p_output;
366 /* Silent unwanted samples */
367 if( p_sys->i_reject_count > 0 )
369 memset( p_sys->p_output, 0, i_output );
370 p_sys->i_reject_count--;
373 p_buffer = SplitBuffer( p_dec );
374 if( !p_buffer ) block_Release( p_block );
378 /*****************************************************************************
379 * EndAudioDec: audio decoder destruction
380 *****************************************************************************/
381 void EndAudioDec( decoder_t *p_dec )
383 decoder_sys_t *p_sys = p_dec->p_sys;
385 free( p_sys->p_output );
388 /*****************************************************************************
390 *****************************************************************************/
391 static const uint64_t pi_channels_map[][2] =
393 { CH_FRONT_LEFT, AOUT_CHAN_LEFT },
394 { CH_FRONT_RIGHT, AOUT_CHAN_RIGHT },
395 { CH_FRONT_CENTER, AOUT_CHAN_CENTER },
396 { CH_LOW_FREQUENCY, AOUT_CHAN_LFE },
397 { CH_BACK_LEFT, AOUT_CHAN_REARLEFT },
398 { CH_BACK_RIGHT, AOUT_CHAN_REARRIGHT },
399 { CH_FRONT_LEFT_OF_CENTER, 0 },
400 { CH_FRONT_RIGHT_OF_CENTER, 0 },
401 { CH_BACK_CENTER, AOUT_CHAN_REARCENTER },
402 { CH_SIDE_LEFT, AOUT_CHAN_MIDDLELEFT },
403 { CH_SIDE_RIGHT, AOUT_CHAN_MIDDLERIGHT },
404 { CH_TOP_CENTER, 0 },
405 { CH_TOP_FRONT_LEFT, 0 },
406 { CH_TOP_FRONT_CENTER, 0 },
407 { CH_TOP_FRONT_RIGHT, 0 },
408 { CH_TOP_BACK_LEFT, 0 },
409 { CH_TOP_BACK_CENTER, 0 },
410 { CH_TOP_BACK_RIGHT, 0 },
411 { CH_STEREO_LEFT, 0 },
412 { CH_STEREO_RIGHT, 0 },
415 static void SetupOutputFormat( decoder_t *p_dec )
417 decoder_sys_t *p_sys = p_dec->p_sys;
419 #if defined(AV_VERSION_INT) && LIBAVCODEC_VERSION_INT >= AV_VERSION_INT( 51, 65, 0 )
420 switch( p_sys->p_context->sample_fmt )
423 p_dec->fmt_out.i_codec = VLC_FOURCC('u','8',' ',' ');
424 p_dec->fmt_out.audio.i_bitspersample = 8;
427 p_dec->fmt_out.i_codec = AOUT_FMT_S32_NE;
428 p_dec->fmt_out.audio.i_bitspersample = 32;
431 p_dec->fmt_out.i_codec = VLC_FOURCC('f','l','3','2');
432 p_dec->fmt_out.audio.i_bitspersample = 32;
435 p_dec->fmt_out.i_codec = VLC_FOURCC('f','l','6','4');
436 p_dec->fmt_out.audio.i_bitspersample = 64;
441 p_dec->fmt_out.i_codec = AOUT_FMT_S16_NE;
442 p_dec->fmt_out.audio.i_bitspersample = 16;
446 p_dec->fmt_out.i_codec = AOUT_FMT_S16_NE;
447 p_dec->fmt_out.audio.i_bitspersample = 16;
449 p_dec->fmt_out.audio.i_rate = p_sys->p_context->sample_rate;
450 p_dec->fmt_out.audio.i_channels = p_sys->p_context->channels;
453 if( p_sys->i_previous_channels == p_sys->p_context->channels &&
454 p_sys->i_previous_layout == p_sys->p_context->channel_layout )
456 p_sys->i_previous_channels = p_sys->p_context->channels;
457 p_sys->i_previous_layout = p_sys->p_context->channel_layout;
460 * FIXME should we use fmt_in.audio.i_physical_channels or not ?
462 const unsigned i_order_max = 8 * sizeof(p_sys->p_context->channel_layout);
463 uint32_t pi_order_src[i_order_max];
464 int i_channels_src = 0;
466 if( p_sys->p_context->channel_layout )
468 for( unsigned i = 0; i < sizeof(pi_channels_map)/sizeof(*pi_channels_map); i++ )
470 if( p_sys->p_context->channel_layout & pi_channels_map[i][0] )
471 pi_order_src[i_channels_src++] = pi_channels_map[i][1];
476 /* Create default order */
477 msg_Warn( p_dec, "Physical channel configuration not set : guessing" );
478 for( unsigned int i = 0; i < __MIN( i_order_max, (unsigned)p_sys->p_context->channels ); i++ )
480 if( i < sizeof(pi_channels_map)/sizeof(*pi_channels_map) )
481 pi_order_src[i_channels_src++] = pi_channels_map[i][1];
484 if( i_channels_src != p_sys->p_context->channels )
485 msg_Err( p_dec, "Channel layout not understood" );
487 uint32_t i_layout_dst;
489 p_sys->b_extract = aout_CheckChannelExtraction( p_sys->pi_extraction,
490 &i_layout_dst, &i_channels_dst,
491 NULL, pi_order_src, i_channels_src );
492 if( i_channels_dst != i_channels_src )
493 msg_Warn( p_dec, "%d channels are dropped", i_channels_src - i_channels_dst );
495 p_dec->fmt_out.audio.i_physical_channels =
496 p_dec->fmt_out.audio.i_original_channels = i_layout_dst;
497 p_dec->fmt_out.audio.i_channels = i_channels_dst;