1 /*****************************************************************************
2 * audio.c: transcoding stream output module (audio)
3 *****************************************************************************
4 * Copyright (C) 2003-2009 the VideoLAN team
7 * Authors: Laurent Aimar <fenrir@via.ecp.fr>
8 * Gildas Bazin <gbazin@videolan.org>
9 * Jean-Paul Saman <jpsaman #_at_# m2x dot nl>
10 * Antoine Cellerier <dionoea at videolan dot org>
12 * This program is free software; you can redistribute it and/or modify
13 * it under the terms of the GNU General Public License as published by
14 * the Free Software Foundation; either version 2 of the License, or
15 * (at your option) any later version.
17 * This program is distributed in the hope that it will be useful,
18 * but WITHOUT ANY WARRANTY; without even the implied warranty of
19 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
20 * GNU General Public License for more details.
22 * You should have received a copy of the GNU General Public License
23 * along with this program; if not, write to the Free Software
24 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston MA 02110-1301, USA.
25 *****************************************************************************/
27 /*****************************************************************************
29 *****************************************************************************/
31 #include "transcode.h"
35 #include <vlc_modules.h>
37 static const int pi_channels_maps[6] =
40 AOUT_CHAN_CENTER, AOUT_CHAN_LEFT | AOUT_CHAN_RIGHT,
41 AOUT_CHAN_CENTER | AOUT_CHAN_LEFT | AOUT_CHAN_RIGHT,
42 AOUT_CHAN_LEFT | AOUT_CHAN_RIGHT | AOUT_CHAN_REARLEFT
43 | AOUT_CHAN_REARRIGHT,
44 AOUT_CHAN_LEFT | AOUT_CHAN_RIGHT | AOUT_CHAN_CENTER
45 | AOUT_CHAN_REARLEFT | AOUT_CHAN_REARRIGHT
48 static block_t *audio_new_buffer( decoder_t *p_dec, int i_samples )
53 if( p_dec->fmt_out.audio.i_bitspersample )
55 i_size = i_samples * p_dec->fmt_out.audio.i_bitspersample / 8 *
56 p_dec->fmt_out.audio.i_channels;
58 else if( p_dec->fmt_out.audio.i_bytes_per_frame &&
59 p_dec->fmt_out.audio.i_frame_length )
61 i_size = i_samples * p_dec->fmt_out.audio.i_bytes_per_frame /
62 p_dec->fmt_out.audio.i_frame_length;
66 i_size = i_samples * 4 * p_dec->fmt_out.audio.i_channels;
69 p_block = block_Alloc( i_size );
70 p_block->i_nb_samples = i_samples;
74 static int transcode_audio_filter_allocation_init( filter_t *p_filter,
82 static bool transcode_audio_filter_needed( const es_format_t *p_fmt1, const es_format_t *p_fmt2 )
84 if( p_fmt1->i_codec != p_fmt2->i_codec ||
85 p_fmt1->audio.i_channels != p_fmt2->audio.i_channels ||
86 p_fmt1->audio.i_rate != p_fmt2->audio.i_rate )
90 static int transcode_audio_filter_chain_build( sout_stream_t *p_stream, filter_chain_t *p_chain,
91 const es_format_t *p_dst, const es_format_t *p_src )
93 if( !transcode_audio_filter_needed( p_dst, p_src ) )
96 es_format_t current = *p_src;
98 msg_Dbg( p_stream, "Looking for filter "
99 "(%4.4s->%4.4s, channels %d->%d, rate %d->%d)",
100 (const char *)&p_src->i_codec,
101 (const char *)&p_dst->i_codec,
102 p_src->audio.i_channels,
103 p_dst->audio.i_channels,
105 p_dst->audio.i_rate );
107 /* If any filter is needed, convert to fl32 */
108 if( current.i_codec != VLC_CODEC_FL32 )
110 /* First step, convert to fl32 */
112 current.audio.i_format = VLC_CODEC_FL32;
113 aout_FormatPrepare( ¤t.audio );
115 if( !filter_chain_AppendFilter( p_chain, NULL, NULL, NULL, ¤t ) )
117 msg_Err( p_stream, "Failed to find conversion filter to floating point" );
120 current = *filter_chain_GetFmtOut( p_chain );
123 /* Fix sample rate */
124 if( current.audio.i_rate != p_dst->audio.i_rate )
126 current.audio.i_rate = p_dst->audio.i_rate;
127 aout_FormatPrepare( ¤t.audio );
128 if( !filter_chain_AppendFilter( p_chain, NULL, NULL, NULL, ¤t ) )
130 msg_Err( p_stream, "Failed to find conversion filter for resampling" );
133 current = *filter_chain_GetFmtOut( p_chain );
137 if( current.audio.i_channels != p_dst->audio.i_channels )
139 current.audio.i_channels = p_dst->audio.i_channels;
140 current.audio.i_physical_channels = p_dst->audio.i_physical_channels;
141 current.audio.i_original_channels = p_dst->audio.i_original_channels;
143 if( ( !current.audio.i_physical_channels || !current.audio.i_original_channels ) &&
144 current.audio.i_channels < 6 )
145 current.audio.i_physical_channels =
146 current.audio.i_original_channels = pi_channels_maps[current.audio.i_channels];
148 aout_FormatPrepare( ¤t.audio );
149 if( !filter_chain_AppendFilter( p_chain, NULL, NULL, NULL, ¤t ) )
151 msg_Err( p_stream, "Failed to find conversion filter for channel mixing" );
154 current = *filter_chain_GetFmtOut( p_chain );
156 /* And last step, convert to the requested codec */
157 if( current.i_codec != p_dst->i_codec )
159 current.i_codec = p_dst->i_codec;
160 aout_FormatPrepare( ¤t.audio );
161 if( !filter_chain_AppendFilter( p_chain, NULL, NULL, NULL, ¤t ) )
163 msg_Err( p_stream, "Failed to find conversion filter to %4.4s",
164 (const char*)&p_dst->i_codec);
167 current = *filter_chain_GetFmtOut( p_chain );
170 if( transcode_audio_filter_needed( p_dst, ¤t ) )
172 /* Weird case, a filter has side effects, doomed */
173 msg_Err( p_stream, "Failed to create a valid audio filter chain" );
177 msg_Dbg( p_stream, "Got complete audio filter chain" );
182 int transcode_audio_new( sout_stream_t *p_stream,
183 sout_stream_id_t *id )
185 sout_stream_sys_t *p_sys = p_stream->p_sys;
186 es_format_t fmt_last;
192 /* Initialization of decoder structures */
193 id->p_decoder->fmt_out = id->p_decoder->fmt_in;
194 id->p_decoder->fmt_out.i_extra = 0;
195 id->p_decoder->fmt_out.p_extra = 0;
196 id->p_decoder->pf_decode_audio = NULL;
197 id->p_decoder->pf_aout_buffer_new = audio_new_buffer;
198 /* id->p_decoder->p_cfg = p_sys->p_audio_cfg; */
200 id->p_decoder->p_module =
201 module_need( id->p_decoder, "decoder", "$codec", false );
202 if( !id->p_decoder->p_module )
204 msg_Err( p_stream, "cannot find audio decoder" );
207 /* decoders don't set audio.i_format, but audio filters use it */
208 id->p_decoder->fmt_out.audio.i_format = id->p_decoder->fmt_out.i_codec;
209 id->p_decoder->fmt_out.audio.i_bitspersample =
210 aout_BitsPerSample( id->p_decoder->fmt_out.i_codec );
211 fmt_last = id->p_decoder->fmt_out;
212 /* Fix AAC SBR changing number of channels and sampling rate */
213 if( !(id->p_decoder->fmt_in.i_codec == VLC_CODEC_MP4A &&
214 fmt_last.audio.i_rate != id->p_encoder->fmt_in.audio.i_rate &&
215 fmt_last.audio.i_channels != id->p_encoder->fmt_in.audio.i_channels) )
216 fmt_last.audio.i_rate = id->p_decoder->fmt_in.audio.i_rate;
222 /* Initialization of encoder format structures */
223 es_format_Init( &id->p_encoder->fmt_in, id->p_decoder->fmt_in.i_cat,
224 id->p_decoder->fmt_out.i_codec );
225 id->p_encoder->fmt_in.audio.i_format = id->p_decoder->fmt_out.i_codec;
227 id->p_encoder->fmt_in.audio.i_rate = id->p_encoder->fmt_out.audio.i_rate;
228 id->p_encoder->fmt_in.audio.i_physical_channels =
229 id->p_encoder->fmt_out.audio.i_physical_channels;
230 id->p_encoder->fmt_in.audio.i_original_channels =
231 id->p_encoder->fmt_out.audio.i_original_channels;
232 id->p_encoder->fmt_in.audio.i_channels =
233 id->p_encoder->fmt_out.audio.i_channels;
234 id->p_encoder->fmt_in.audio.i_bitspersample =
235 aout_BitsPerSample( id->p_encoder->fmt_in.i_codec );
237 id->p_encoder->p_cfg = p_stream->p_sys->p_audio_cfg;
238 id->p_encoder->p_module =
239 module_need( id->p_encoder, "encoder", p_sys->psz_aenc, true );
240 if( !id->p_encoder->p_module )
242 msg_Err( p_stream, "cannot find audio encoder (module:%s fourcc:%4.4s). Take a look few lines earlier to see possible reason.",
243 p_sys->psz_aenc ? p_sys->psz_aenc : "any",
244 (char *)&p_sys->i_acodec );
245 module_unneed( id->p_decoder, id->p_decoder->p_module );
246 id->p_decoder->p_module = NULL;
249 id->p_encoder->fmt_in.audio.i_format = id->p_encoder->fmt_in.i_codec;
250 id->p_encoder->fmt_in.audio.i_bitspersample =
251 aout_BitsPerSample( id->p_encoder->fmt_in.i_codec );
253 /* Load user specified audio filters */
256 es_format_t fmt_fl32 = fmt_last;
258 fmt_fl32.audio.i_format = VLC_CODEC_FL32;
259 id->p_uf_chain = filter_chain_New( p_stream, "audio filter", false,
260 transcode_audio_filter_allocation_init, NULL, NULL );
261 filter_chain_Reset( id->p_uf_chain, &fmt_last, &fmt_fl32 );
263 if( transcode_audio_filter_chain_build( p_stream, id->p_uf_chain,
264 &fmt_fl32, &fmt_last ) )
266 transcode_audio_close( id );
271 if( filter_chain_AppendFromString( id->p_uf_chain, p_sys->psz_af ) > 0 )
272 fmt_last = *filter_chain_GetFmtOut( id->p_uf_chain );
275 /* Load conversion filters */
276 id->p_f_chain = filter_chain_New( p_stream, "audio converter", true,
277 transcode_audio_filter_allocation_init, NULL, NULL );
278 filter_chain_Reset( id->p_f_chain, &fmt_last, &id->p_encoder->fmt_in );
280 if( transcode_audio_filter_chain_build( p_stream, id->p_f_chain,
281 &id->p_encoder->fmt_in, &fmt_last ) )
283 transcode_audio_close( id );
286 fmt_last = id->p_encoder->fmt_in;
289 id->p_encoder->fmt_out.i_codec =
290 vlc_fourcc_GetCodec( AUDIO_ES, id->p_encoder->fmt_out.i_codec );
295 void transcode_audio_close( sout_stream_id_t *id )
298 if( id->p_decoder->p_module )
299 module_unneed( id->p_decoder, id->p_decoder->p_module );
300 id->p_decoder->p_module = NULL;
302 if( id->p_decoder->p_description )
303 vlc_meta_Delete( id->p_decoder->p_description );
304 id->p_decoder->p_description = NULL;
307 if( id->p_encoder->p_module )
308 module_unneed( id->p_encoder, id->p_encoder->p_module );
309 id->p_encoder->p_module = NULL;
313 filter_chain_Delete( id->p_uf_chain );
315 filter_chain_Delete( id->p_f_chain );
318 int transcode_audio_process( sout_stream_t *p_stream,
319 sout_stream_id_t *id,
320 block_t *in, block_t **out )
322 sout_stream_sys_t *p_sys = p_stream->p_sys;
323 block_t *p_block, *p_audio_buf;
326 if( unlikely( in == NULL ) )
330 p_block = id->p_encoder->pf_encode_audio(id->p_encoder, NULL );
331 block_ChainAppend( out, p_block );
336 while( (p_audio_buf = id->p_decoder->pf_decode_audio( id->p_decoder,
339 if( p_sys->b_master_sync )
341 mtime_t i_pts = date_Get( &id->interpolated_pts ) + 1;
342 mtime_t i_drift = p_audio_buf->i_pts - i_pts;
343 if (i_drift > MASTER_SYNC_MAX_DRIFT || i_drift < -MASTER_SYNC_MAX_DRIFT)
346 "drift is too high (%"PRId64"), resetting master sync",
348 date_Set( &id->interpolated_pts, p_audio_buf->i_pts );
349 i_pts = p_audio_buf->i_pts + 1;
351 p_sys->i_master_drift = p_audio_buf->i_pts - i_pts;
352 date_Increment( &id->interpolated_pts, p_audio_buf->i_nb_samples );
353 p_audio_buf->i_pts = i_pts;
356 p_audio_buf->i_dts = p_audio_buf->i_pts;
358 /* Run filter chain */
361 p_audio_buf = filter_chain_AudioFilter( id->p_uf_chain,
367 p_audio_buf = filter_chain_AudioFilter( id->p_f_chain, p_audio_buf );
371 p_audio_buf->i_dts = p_audio_buf->i_pts;
373 p_block = id->p_encoder->pf_encode_audio( id->p_encoder, p_audio_buf );
375 block_ChainAppend( out, p_block );
376 block_Release( p_audio_buf );
382 bool transcode_audio_add( sout_stream_t *p_stream, es_format_t *p_fmt,
383 sout_stream_id_t *id )
385 sout_stream_sys_t *p_sys = p_stream->p_sys;
388 "creating audio transcoding from fcc=`%4.4s' to fcc=`%4.4s'",
389 (char*)&p_fmt->i_codec, (char*)&p_sys->i_acodec );
391 /* Complete destination format */
392 id->p_encoder->fmt_out.i_codec = p_sys->i_acodec;
393 id->p_encoder->fmt_out.audio.i_rate = p_sys->i_sample_rate > 0 ?
394 p_sys->i_sample_rate : p_fmt->audio.i_rate;
395 id->p_encoder->fmt_out.i_bitrate = p_sys->i_abitrate;
396 id->p_encoder->fmt_out.audio.i_bitspersample =
397 p_fmt->audio.i_bitspersample;
398 id->p_encoder->fmt_out.audio.i_channels = p_sys->i_channels > 0 ?
399 p_sys->i_channels : p_fmt->audio.i_channels;
400 /* Sanity check for audio channels */
401 id->p_encoder->fmt_out.audio.i_channels =
402 __MIN( id->p_encoder->fmt_out.audio.i_channels,
403 id->p_decoder->fmt_in.audio.i_channels );
404 id->p_encoder->fmt_out.audio.i_original_channels =
405 id->p_decoder->fmt_in.audio.i_physical_channels;
406 if( id->p_decoder->fmt_in.audio.i_channels ==
407 id->p_encoder->fmt_out.audio.i_channels )
409 id->p_encoder->fmt_out.audio.i_physical_channels =
410 id->p_decoder->fmt_in.audio.i_physical_channels;
414 id->p_encoder->fmt_out.audio.i_physical_channels =
415 pi_channels_maps[id->p_encoder->fmt_out.audio.i_channels];
418 /* Build decoder -> filter -> encoder chain */
419 if( transcode_audio_new( p_stream, id ) )
421 msg_Err( p_stream, "cannot create audio chain" );
425 /* Open output stream */
426 id->id = sout_StreamIdAdd( p_stream->p_next, &id->p_encoder->fmt_out );
427 id->b_transcode = true;
431 transcode_audio_close( id );
435 date_Init( &id->interpolated_pts, p_fmt->audio.i_rate, 1 );