]> git.sesse.net Git - vlc/blob - modules/stream_out/transcode/audio.c
5f7530ef4ca2f8510255a5882b118f465674aae0
[vlc] / modules / stream_out / transcode / audio.c
1 /*****************************************************************************
2  * audio.c: transcoding stream output module (audio)
3  *****************************************************************************
4  * Copyright (C) 2003-2009 the VideoLAN team
5  * $Id$
6  *
7  * Authors: Laurent Aimar <fenrir@via.ecp.fr>
8  *          Gildas Bazin <gbazin@videolan.org>
9  *          Jean-Paul Saman <jpsaman #_at_# m2x dot nl>
10  *          Antoine Cellerier <dionoea at videolan dot org>
11  *
12  * This program is free software; you can redistribute it and/or modify
13  * it under the terms of the GNU General Public License as published by
14  * the Free Software Foundation; either version 2 of the License, or
15  * (at your option) any later version.
16  *
17  * This program is distributed in the hope that it will be useful,
18  * but WITHOUT ANY WARRANTY; without even the implied warranty of
19  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
20  * GNU General Public License for more details.
21  *
22  * You should have received a copy of the GNU General Public License
23  * along with this program; if not, write to the Free Software
24  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston MA 02110-1301, USA.
25  *****************************************************************************/
26
27 /*****************************************************************************
28  * Preamble
29  *****************************************************************************/
30
31 #include "transcode.h"
32
33 #include <vlc_aout.h>
34 #include <vlc_meta.h>
35
36 static const int pi_channels_maps[6] =
37 {
38     0,
39     AOUT_CHAN_CENTER,   AOUT_CHAN_LEFT | AOUT_CHAN_RIGHT,
40     AOUT_CHAN_CENTER | AOUT_CHAN_LEFT | AOUT_CHAN_RIGHT,
41     AOUT_CHAN_LEFT | AOUT_CHAN_RIGHT | AOUT_CHAN_REARLEFT
42      | AOUT_CHAN_REARRIGHT,
43     AOUT_CHAN_LEFT | AOUT_CHAN_RIGHT | AOUT_CHAN_CENTER
44      | AOUT_CHAN_REARLEFT | AOUT_CHAN_REARRIGHT
45 };
46
47 static inline void audio_timer_start( encoder_t * p_encoder )
48 {
49     stats_TimerStart( p_encoder, "encoding audio frame",
50                       STATS_TIMER_AUDIO_FRAME_ENCODING );
51 }
52
53 static inline void audio_timer_stop( encoder_t * p_encoder )
54 {
55     stats_TimerStop( p_encoder, STATS_TIMER_AUDIO_FRAME_ENCODING );
56 }
57
58 static inline void audio_timer_close( encoder_t * p_encoder )
59 {
60     stats_TimerDump(  p_encoder, STATS_TIMER_AUDIO_FRAME_ENCODING );
61     stats_TimerClean( p_encoder, STATS_TIMER_AUDIO_FRAME_ENCODING );
62 }
63
64 static block_t *transcode_audio_alloc( filter_t *p_filter, int size )
65 {
66     VLC_UNUSED( p_filter );
67     return block_Alloc( size );
68 }
69
70 static aout_buffer_t *audio_new_buffer( decoder_t *p_dec, int i_samples )
71 {
72     block_t *p_block;
73     int i_size;
74
75     if( p_dec->fmt_out.audio.i_bitspersample )
76     {
77         i_size = i_samples * p_dec->fmt_out.audio.i_bitspersample / 8 *
78             p_dec->fmt_out.audio.i_channels;
79     }
80     else if( p_dec->fmt_out.audio.i_bytes_per_frame &&
81              p_dec->fmt_out.audio.i_frame_length )
82     {
83         i_size = i_samples * p_dec->fmt_out.audio.i_bytes_per_frame /
84             p_dec->fmt_out.audio.i_frame_length;
85     }
86     else
87     {
88         i_size = i_samples * 4 * p_dec->fmt_out.audio.i_channels;
89     }
90
91     p_block = block_New( p_dec, i_size );
92     p_block->i_nb_samples = i_samples;
93     return p_block;
94 }
95
96 static void audio_del_buffer( decoder_t *p_dec, aout_buffer_t *p_buffer )
97 {
98     VLC_UNUSED(p_dec);
99     block_Release( p_buffer );
100 }
101
102 static int transcode_audio_filter_allocation_init( filter_t *p_filter,
103                                                    void *data )
104 {
105     VLC_UNUSED(data);
106     p_filter->pf_audio_buffer_new = transcode_audio_alloc;
107     return VLC_SUCCESS;
108 }
109
110 static bool transcode_audio_filter_needed( const es_format_t *p_fmt1, const es_format_t *p_fmt2 )
111 {
112     if( p_fmt1->i_codec != p_fmt2->i_codec ||
113         p_fmt1->audio.i_channels != p_fmt2->audio.i_channels ||
114         p_fmt1->audio.i_rate != p_fmt2->audio.i_rate )
115         return true;
116     return false;
117 }
118 static int transcode_audio_filter_chain_build( sout_stream_t *p_stream, filter_chain_t *p_chain,
119                                                const es_format_t *p_dst, const es_format_t *p_src )
120 {
121     if( !transcode_audio_filter_needed( p_dst, p_src ) )
122         return VLC_SUCCESS;
123
124     es_format_t current = *p_src;
125
126     msg_Dbg( p_stream, "Looking for filter "
127              "(%4.4s->%4.4s, channels %d->%d, rate %d->%d)",
128          (const char *)&p_src->i_codec,
129          (const char *)&p_dst->i_codec,
130          p_src->audio.i_channels,
131          p_dst->audio.i_channels,
132          p_src->audio.i_rate,
133          p_dst->audio.i_rate );
134
135     /* If any filter is needed, convert to fl32 */
136     if( current.i_codec != VLC_CODEC_FL32 )
137     {
138         /* First step, convert to fl32 */
139         current.i_codec =
140         current.audio.i_format = VLC_CODEC_FL32;
141         aout_FormatPrepare( &current.audio );
142
143         if( !filter_chain_AppendFilter( p_chain, NULL, NULL, NULL, &current ) )
144         {
145             msg_Err( p_stream, "Failed to find conversion filter to fl32" );
146             return VLC_EGENERIC;
147         }
148         current = *filter_chain_GetFmtOut( p_chain );
149     }
150
151     /* Fix sample rate */
152     if( current.audio.i_rate != p_dst->audio.i_rate )
153     {
154         current.audio.i_rate = p_dst->audio.i_rate;
155         aout_FormatPrepare( &current.audio );
156         if( !filter_chain_AppendFilter( p_chain, NULL, NULL, NULL, &current ) )
157         {
158             msg_Err( p_stream, "Failed to find conversion filter for resampling" );
159             return VLC_EGENERIC;
160         }
161         current = *filter_chain_GetFmtOut( p_chain );
162     }
163
164     /* Fix channels */
165     if( current.audio.i_channels != p_dst->audio.i_channels )
166     {
167         current.audio.i_channels = p_dst->audio.i_channels;
168         current.audio.i_physical_channels = p_dst->audio.i_physical_channels;
169         current.audio.i_original_channels = p_dst->audio.i_original_channels;
170
171         if( ( !current.audio.i_physical_channels || !current.audio.i_original_channels ) &&
172             current.audio.i_channels < 6 )
173             current.audio.i_physical_channels =
174             current.audio.i_original_channels = pi_channels_maps[current.audio.i_channels];
175
176         aout_FormatPrepare( &current.audio );
177         if( !filter_chain_AppendFilter( p_chain, NULL, NULL, NULL, &current ) )
178         {
179             msg_Err( p_stream, "Failed to find conversion filter for channel mixing" );
180             return VLC_EGENERIC;
181         }
182         current = *filter_chain_GetFmtOut( p_chain );
183     }
184     /* And last step, convert to the requested codec */
185     if( current.i_codec != p_dst->i_codec )
186     {
187         current.i_codec = p_dst->i_codec;
188         aout_FormatPrepare( &current.audio );
189         if( !filter_chain_AppendFilter( p_chain, NULL, NULL, NULL, &current ) )
190         {
191             msg_Err( p_stream, "Failed to find conversion filter to %4.4s",
192                      (const char*)&p_dst->i_codec);
193             return VLC_EGENERIC;
194         }
195         current = *filter_chain_GetFmtOut( p_chain );
196     }
197
198     if( transcode_audio_filter_needed( p_dst, &current ) )
199     {
200         /* Weird case, a filter has side effects, doomed */
201         msg_Err( p_stream, "Failed to create a valid audio filter chain" );
202         return VLC_EGENERIC;
203     }
204
205     msg_Dbg( p_stream, "Got complete audio filter chain" );
206     return VLC_SUCCESS;
207 }
208
209
210 int transcode_audio_new( sout_stream_t *p_stream,
211                                 sout_stream_id_t *id )
212 {
213     sout_stream_sys_t *p_sys = p_stream->p_sys;
214     es_format_t fmt_last;
215
216     /*
217      * Open decoder
218      */
219
220     /* Initialization of decoder structures */
221     id->p_decoder->fmt_out = id->p_decoder->fmt_in;
222     id->p_decoder->fmt_out.i_extra = 0;
223     id->p_decoder->fmt_out.p_extra = 0;
224     id->p_decoder->pf_decode_audio = NULL;
225     id->p_decoder->pf_aout_buffer_new = audio_new_buffer;
226     id->p_decoder->pf_aout_buffer_del = audio_del_buffer;
227     /* id->p_decoder->p_cfg = p_sys->p_audio_cfg; */
228
229     id->p_decoder->p_module =
230         module_need( id->p_decoder, "decoder", "$codec", false );
231     if( !id->p_decoder->p_module )
232     {
233         msg_Err( p_stream, "cannot find audio decoder" );
234         return VLC_EGENERIC;
235     }
236     id->p_decoder->fmt_out.audio.i_bitspersample =
237         aout_BitsPerSample( id->p_decoder->fmt_out.i_codec );
238     fmt_last = id->p_decoder->fmt_out;
239     /* Fix AAC SBR changing number of channels and sampling rate */
240     if( !(id->p_decoder->fmt_in.i_codec == VLC_CODEC_MP4A &&
241         fmt_last.audio.i_rate != id->p_encoder->fmt_in.audio.i_rate &&
242         fmt_last.audio.i_channels != id->p_encoder->fmt_in.audio.i_channels) )
243         fmt_last.audio.i_rate = id->p_decoder->fmt_in.audio.i_rate;
244
245     /*
246      * Open encoder
247      */
248
249     /* Initialization of encoder format structures */
250     es_format_Init( &id->p_encoder->fmt_in, id->p_decoder->fmt_in.i_cat,
251                     id->p_decoder->fmt_out.i_codec );
252     id->p_encoder->fmt_in.audio.i_format = id->p_decoder->fmt_out.i_codec;
253
254     id->p_encoder->fmt_in.audio.i_rate = id->p_encoder->fmt_out.audio.i_rate;
255     id->p_encoder->fmt_in.audio.i_physical_channels =
256         id->p_encoder->fmt_out.audio.i_physical_channels;
257     id->p_encoder->fmt_in.audio.i_original_channels =
258         id->p_encoder->fmt_out.audio.i_original_channels;
259     id->p_encoder->fmt_in.audio.i_channels =
260         id->p_encoder->fmt_out.audio.i_channels;
261     id->p_encoder->fmt_in.audio.i_bitspersample =
262         aout_BitsPerSample( id->p_encoder->fmt_in.i_codec );
263
264     id->p_encoder->p_cfg = p_stream->p_sys->p_audio_cfg;
265     id->p_encoder->p_module =
266         module_need( id->p_encoder, "encoder", p_sys->psz_aenc, true );
267     if( !id->p_encoder->p_module )
268     {
269         msg_Err( p_stream, "cannot find audio encoder (module:%s fourcc:%4.4s). Take a look few lines earlier to see possible reason.",
270                  p_sys->psz_aenc ? p_sys->psz_aenc : "any",
271                  (char *)&p_sys->i_acodec );
272         module_unneed( id->p_decoder, id->p_decoder->p_module );
273         id->p_decoder->p_module = NULL;
274         return VLC_EGENERIC;
275     }
276     id->p_encoder->fmt_in.audio.i_format = id->p_encoder->fmt_in.i_codec;
277     id->p_encoder->fmt_in.audio.i_bitspersample =
278         aout_BitsPerSample( id->p_encoder->fmt_in.i_codec );
279
280     /* Load user specified audio filters */
281     if( p_sys->psz_af )
282     {
283         es_format_t fmt_fl32 = fmt_last;
284         fmt_fl32.i_codec =
285         fmt_fl32.audio.i_format = VLC_CODEC_FL32;
286         if( transcode_audio_filter_chain_build( p_stream, id->p_uf_chain,
287                                                 &fmt_fl32, &fmt_last ) )
288         {
289             transcode_audio_close( id );
290             return VLC_EGENERIC;
291         }
292         fmt_last = fmt_fl32;
293
294         id->p_uf_chain = filter_chain_New( p_stream, "audio filter", false,
295                                            transcode_audio_filter_allocation_init, NULL, NULL );
296         filter_chain_Reset( id->p_uf_chain, &fmt_last, &fmt_fl32 );
297         if( filter_chain_AppendFromString( id->p_uf_chain, p_sys->psz_af ) > 0 )
298             fmt_last = *filter_chain_GetFmtOut( id->p_uf_chain );
299     }
300
301     /* Load conversion filters */
302     id->p_f_chain = filter_chain_New( p_stream, "audio filter", true,
303                     transcode_audio_filter_allocation_init, NULL, NULL );
304     filter_chain_Reset( id->p_f_chain, &fmt_last, &id->p_encoder->fmt_in );
305
306     if( transcode_audio_filter_chain_build( p_stream, id->p_f_chain,
307                                             &id->p_encoder->fmt_in, &fmt_last ) )
308     {
309         transcode_audio_close( id );
310         return VLC_EGENERIC;
311     }
312     fmt_last = id->p_encoder->fmt_in;
313
314     /* */
315     id->p_encoder->fmt_out.i_codec =
316         vlc_fourcc_GetCodec( AUDIO_ES, id->p_encoder->fmt_out.i_codec );
317
318     return VLC_SUCCESS;
319 }
320
321 void transcode_audio_close( sout_stream_id_t *id )
322 {
323     audio_timer_close( id->p_encoder );
324
325     /* Close decoder */
326     if( id->p_decoder->p_module )
327         module_unneed( id->p_decoder, id->p_decoder->p_module );
328     id->p_decoder->p_module = NULL;
329
330     if( id->p_decoder->p_description )
331         vlc_meta_Delete( id->p_decoder->p_description );
332     id->p_decoder->p_description = NULL;
333
334     /* Close encoder */
335     if( id->p_encoder->p_module )
336         module_unneed( id->p_encoder, id->p_encoder->p_module );
337     id->p_encoder->p_module = NULL;
338
339     /* Close filters */
340     if( id->p_uf_chain )
341         filter_chain_Delete( id->p_uf_chain );
342     if( id->p_f_chain )
343         filter_chain_Delete( id->p_f_chain );
344 }
345
346 int transcode_audio_process( sout_stream_t *p_stream,
347                                     sout_stream_id_t *id,
348                                     block_t *in, block_t **out )
349 {
350     sout_stream_sys_t *p_sys = p_stream->p_sys;
351     block_t *p_block, *p_audio_buf;
352     *out = NULL;
353
354     while( (p_audio_buf = id->p_decoder->pf_decode_audio( id->p_decoder,
355                                                           &in )) )
356     {
357         sout_UpdateStatistic( p_stream->p_sout, SOUT_STATISTIC_DECODED_AUDIO, 1 );
358         if( p_sys->b_master_sync )
359         {
360             mtime_t i_dts = date_Get( &id->interpolated_pts ) + 1;
361             if ( p_audio_buf->i_pts - i_dts > MASTER_SYNC_MAX_DRIFT
362                   || p_audio_buf->i_pts - i_dts < -MASTER_SYNC_MAX_DRIFT )
363             {
364                 msg_Dbg( p_stream, "drift is too high, resetting master sync" );
365                 date_Set( &id->interpolated_pts, p_audio_buf->i_pts );
366                 i_dts = p_audio_buf->i_pts + 1;
367             }
368             p_sys->i_master_drift = p_audio_buf->i_pts - i_dts;
369             date_Increment( &id->interpolated_pts, p_audio_buf->i_nb_samples );
370             p_audio_buf->i_pts -= p_sys->i_master_drift;
371         }
372
373         p_audio_buf->i_dts = p_audio_buf->i_pts;
374
375         /* Run filter chain */
376         if( id->p_uf_chain )
377         {
378             p_audio_buf = filter_chain_AudioFilter( id->p_uf_chain,
379                                                     p_audio_buf );
380             if( !p_audio_buf )
381                 abort();
382         }
383
384         p_audio_buf = filter_chain_AudioFilter( id->p_f_chain, p_audio_buf );
385         if( !p_audio_buf )
386             abort();
387
388         p_audio_buf->i_dts = p_audio_buf->i_pts;
389
390         audio_timer_start( id->p_encoder );
391         p_block = id->p_encoder->pf_encode_audio( id->p_encoder, p_audio_buf );
392         audio_timer_stop( id->p_encoder );
393
394         block_ChainAppend( out, p_block );
395         block_Release( p_audio_buf );
396     }
397
398     return VLC_SUCCESS;
399 }
400
401 bool transcode_audio_add( sout_stream_t *p_stream, es_format_t *p_fmt, 
402             sout_stream_id_t *id )
403 {
404     sout_stream_sys_t *p_sys = p_stream->p_sys;
405
406     msg_Dbg( p_stream,
407              "creating audio transcoding from fcc=`%4.4s' to fcc=`%4.4s'",
408              (char*)&p_fmt->i_codec, (char*)&p_sys->i_acodec );
409
410     /* Complete destination format */
411     id->p_encoder->fmt_out.i_codec = p_sys->i_acodec;
412     id->p_encoder->fmt_out.audio.i_rate = p_sys->i_sample_rate > 0 ?
413         p_sys->i_sample_rate : p_fmt->audio.i_rate;
414     id->p_encoder->fmt_out.i_bitrate = p_sys->i_abitrate;
415     id->p_encoder->fmt_out.audio.i_bitspersample =
416         p_fmt->audio.i_bitspersample;
417     id->p_encoder->fmt_out.audio.i_channels = p_sys->i_channels > 0 ?
418         p_sys->i_channels : p_fmt->audio.i_channels;
419     /* Sanity check for audio channels */
420     id->p_encoder->fmt_out.audio.i_channels =
421         __MIN( id->p_encoder->fmt_out.audio.i_channels,
422                id->p_decoder->fmt_in.audio.i_channels );
423     id->p_encoder->fmt_out.audio.i_original_channels =
424         id->p_decoder->fmt_in.audio.i_physical_channels;
425     if( id->p_decoder->fmt_in.audio.i_channels ==
426         id->p_encoder->fmt_out.audio.i_channels )
427     {
428         id->p_encoder->fmt_out.audio.i_physical_channels =
429             id->p_decoder->fmt_in.audio.i_physical_channels;
430     }
431     else
432     {
433         id->p_encoder->fmt_out.audio.i_physical_channels =
434             pi_channels_maps[id->p_encoder->fmt_out.audio.i_channels];
435     }
436
437     /* Build decoder -> filter -> encoder chain */
438     if( transcode_audio_new( p_stream, id ) )
439     {
440         msg_Err( p_stream, "cannot create audio chain" );
441         return false;
442     }
443
444     /* Open output stream */
445     id->id = sout_StreamIdAdd( p_stream->p_next, &id->p_encoder->fmt_out );
446     id->b_transcode = true;
447
448     if( !id->id )
449     {
450         transcode_audio_close( id );
451         return false;
452     }
453
454     date_Init( &id->interpolated_pts, p_fmt->audio.i_rate, 1 );
455
456     return true;
457 }