]> git.sesse.net Git - vlc/blob - modules/packetizer/h264.c
* all: fixed the way h264 streams are stored in .mp4
[vlc] / modules / packetizer / h264.c
1 /*****************************************************************************
2  * h264.c: h264/avc video packetizer
3  *****************************************************************************
4  * Copyright (C) 2001, 2002 VideoLAN
5  * $Id$
6  *
7  * Authors: Laurent Aimar <fenrir@via.ecp.fr>
8  *          Eric Petit <titer@videolan.org>
9  *          Gildas Bazin <gbazin@netcourrier.com>
10  *
11  * This program is free software; you can redistribute it and/or modify
12  * it under the terms of the GNU General Public License as published by
13  * the Free Software Foundation; either version 2 of the License, or
14  * (at your option) any later version.
15  *
16  * This program is distributed in the hope that it will be useful,
17  * but WITHOUT ANY WARRANTY; without even the implied warranty of
18  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
19  * GNU General Public License for more details.
20  *
21  * You should have received a copy of the GNU General Public License
22  * along with this program; if not, write to the Free Software
23  * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111, USA.
24  *****************************************************************************/
25
26 /*****************************************************************************
27  * Preamble
28  *****************************************************************************/
29 #include <stdlib.h>                                      /* malloc(), free() */
30
31 #include <vlc/vlc.h>
32 #include <vlc/decoder.h>
33 #include <vlc/sout.h>
34
35 #include "vlc_block_helper.h"
36 #include "vlc_bits.h"
37
38 /*****************************************************************************
39  * Module descriptor
40  *****************************************************************************/
41 static int  Open ( vlc_object_t * );
42 static void Close( vlc_object_t * );
43
44 vlc_module_begin();
45     set_description( _("H264 video packetizer") );
46     set_capability( "packetizer", 50 );
47     set_callbacks( Open, Close );
48 vlc_module_end();
49
50
51 /****************************************************************************
52  * Local prototypes
53  ****************************************************************************/
54 static block_t *Packetize( decoder_t *, block_t ** );
55 static block_t *PacketizeAVC1( decoder_t *, block_t ** );
56
57 struct decoder_sys_t
58 {
59     block_bytestream_t bytestream;
60
61     int     i_state;
62     int     i_offset;
63     uint8_t startcode[4];
64
65     vlc_bool_t b_slice;
66     block_t    *p_frame;
67
68     int64_t      i_dts;
69     int64_t      i_pts;
70     unsigned int i_flags;
71
72     vlc_bool_t   b_sps;
73
74     /* avcC data */
75     int i_avcC_length_size;
76 };
77
/* States of the start code scanner driven by Packetize(). */
enum
{
    STATE_NOSYNC    = 0,    /* looking for the first start code */
    STATE_NEXT_SYNC = 1     /* start code found, looking for the next one */
};
83
/* nal_unit_type values (low 5 bits of the NAL header byte). */
enum nal_unit_type_e
{
    NAL_UNKNOWN   = 0,
    NAL_SLICE     = 1,
    NAL_SLICE_DPA = 2,
    NAL_SLICE_DPB = 3,
    NAL_SLICE_DPC = 4,
    NAL_SLICE_IDR = 5,    /* ref_idc != 0 */
    NAL_SEI       = 6,    /* ref_idc == 0 */
    NAL_SPS       = 7,
    NAL_PPS       = 8
    /* ref_idc == 0 for 6,9,10,11,12 */
};
97
/* nal_ref_idc values (bits 5-6 of the NAL header byte). */
enum nal_priority_e
{
    NAL_PRIORITY_DISPOSABLE = 0,
    NAL_PRIORITY_LOW,           /* 1 */
    NAL_PRIORITY_HIGH,          /* 2 */
    NAL_PRIORITY_HIGHEST        /* 3 */
};
105
106 static block_t *ParseNALBlock( decoder_t *, block_t * );
107
108 static block_t *nal_get_annexeb( decoder_t *, uint8_t *p, int );
109
110 /*****************************************************************************
111  * Open: probe the packetizer and return score
112  *****************************************************************************/
113 static int Open( vlc_object_t *p_this )
114 {
115     decoder_t     *p_dec = (decoder_t*)p_this;
116     decoder_sys_t *p_sys;
117
118     if( p_dec->fmt_in.i_codec != VLC_FOURCC( 'h', '2', '6', '4') &&
119         p_dec->fmt_in.i_codec != VLC_FOURCC( 'H', '2', '6', '4') &&
120         p_dec->fmt_in.i_codec != VLC_FOURCC( 'V', 'S', 'S', 'H') &&
121         p_dec->fmt_in.i_codec != VLC_FOURCC( 'v', 's', 's', 'h') &&
122         ( p_dec->fmt_in.i_codec != VLC_FOURCC( 'a', 'v', 'c', '1') || p_dec->fmt_in.i_extra < 7 ) )
123     {
124         return VLC_EGENERIC;
125     }
126
127     /* Allocate the memory needed to store the decoder's structure */
128     if( ( p_dec->p_sys = p_sys = malloc( sizeof(decoder_sys_t) ) ) == NULL )
129     {
130         msg_Err( p_dec, "out of memory" );
131         return VLC_EGENERIC;
132     }
133     p_sys->i_state = STATE_NOSYNC;
134     p_sys->i_offset = 0;
135     p_sys->startcode[0] = 0;
136     p_sys->startcode[1] = 0;
137     p_sys->startcode[2] = 0;
138     p_sys->startcode[3] = 1;
139     p_sys->bytestream = block_BytestreamInit( p_dec );
140     p_sys->b_slice = VLC_FALSE;
141     p_sys->p_frame = NULL;
142     p_sys->i_dts   = 0;
143     p_sys->i_pts   = 0;
144     p_sys->i_flags = 0;
145     p_sys->b_sps   = VLC_FALSE;
146
147     /* Setup properties */
148     es_format_Copy( &p_dec->fmt_out, &p_dec->fmt_in );
149     p_dec->fmt_out.i_codec = VLC_FOURCC( 'h', '2', '6', '4' );
150
151     if( p_dec->fmt_in.i_codec == VLC_FOURCC( 'a', 'v', 'c', '1' ) )
152     {
153         uint8_t *p = &((uint8_t*)p_dec->fmt_in.p_extra)[4];
154         int i_sps, i_pps;
155         int i;
156
157         /* Parse avcC */
158         p_sys->i_avcC_length_size = 1 + ((*p++)&0x03);
159
160         /* Read SPS */
161         i_sps = (*p++)&0x1f;
162
163         for( i = 0; i < i_sps; i++ )
164         {
165             int i_length = GetWBE( p );
166             block_t *p_sps = nal_get_annexeb( p_dec, p+2, i_length );
167
168             ParseNALBlock( p_dec, p_sps );
169             p += 2 + i_length;
170         }
171         /* Read PPS */
172         i_pps = *p++;
173         for( i = 0; i < i_pps; i++ )
174         {
175             int i_length = GetWBE( p );
176             block_t *p_pps = nal_get_annexeb( p_dec, p+2, i_length );
177
178             ParseNALBlock( p_dec, p_pps );
179             p += 2 + i_length;
180         }
181         msg_Dbg( p_dec, "avcC length size=%d sps=%d pps=%d",
182                  p_sys->i_avcC_length_size, i_sps, i_pps );
183
184         /* Set callback */
185         p_dec->pf_packetize = PacketizeAVC1;
186     }
187     else
188     {
189         /* Set callback */
190         p_dec->pf_packetize = Packetize;
191     }
192
193     return VLC_SUCCESS;
194 }
195
196 /*****************************************************************************
197  * Close: clean up the packetizer
198  *****************************************************************************/
199 static void Close( vlc_object_t *p_this )
200 {
201     decoder_t *p_dec = (decoder_t*)p_this;
202     decoder_sys_t *p_sys = p_dec->p_sys;
203
204     block_BytestreamRelease( &p_sys->bytestream );
205     free( p_sys );
206 }
207
208 /****************************************************************************
209  * Packetize: the whole thing
210  ****************************************************************************/
211 static block_t *Packetize( decoder_t *p_dec, block_t **pp_block )
212 {
213     decoder_sys_t *p_sys = p_dec->p_sys;
214     block_t       *p_pic;
215
216     if( !pp_block || !*pp_block ) return NULL;
217
218     block_BytestreamPush( &p_sys->bytestream, *pp_block );
219
220     for( ;; )
221     {
222         switch( p_sys->i_state )
223         {
224             case STATE_NOSYNC:
225                 if( block_FindStartcodeFromOffset( &p_sys->bytestream,
226                         &p_sys->i_offset, p_sys->startcode, 4 ) == VLC_SUCCESS )
227                 {
228                     p_sys->i_state = STATE_NEXT_SYNC;
229                 }
230
231                 if( p_sys->i_offset )
232                 {
233                     block_SkipBytes( &p_sys->bytestream, p_sys->i_offset );
234                     p_sys->i_offset = 0;
235                     block_BytestreamFlush( &p_sys->bytestream );
236                 }
237
238                 if( p_sys->i_state != STATE_NEXT_SYNC )
239                 {
240                     /* Need more data */
241                     return NULL;
242                 }
243
244                 p_sys->i_offset = 1; /* To find next startcode */
245
246             case STATE_NEXT_SYNC:
247                 /* Find the next startcode */
248                 if( block_FindStartcodeFromOffset( &p_sys->bytestream,
249                         &p_sys->i_offset, p_sys->startcode, 4 ) != VLC_SUCCESS )
250                 {
251                     /* Need more data */
252                     return NULL;
253                 }
254
255                 /* Get the new fragment and set the pts/dts */
256                 p_pic = block_New( p_dec, p_sys->i_offset );
257                 p_pic->i_pts = p_sys->bytestream.p_block->i_pts;
258                 p_pic->i_dts = p_sys->bytestream.p_block->i_dts;
259
260                 block_GetBytes( &p_sys->bytestream, p_pic->p_buffer,
261                                 p_pic->i_buffer );
262
263                 p_sys->i_offset = 0;
264
265                 /* Parse the NAL */
266                 if( !( p_pic = ParseNALBlock( p_dec, p_pic ) ) )
267                 {
268                     p_sys->i_state = STATE_NOSYNC;
269                     break;
270                 }
271
272                 /* So p_block doesn't get re-added several times */
273                 *pp_block = block_BytestreamPop( &p_sys->bytestream );
274
275                 p_sys->i_state = STATE_NOSYNC;
276
277                 return p_pic;
278         }
279     }
280 }
281
282 /****************************************************************************
283  * PacketizeAVC1: the whole thing
284  ****************************************************************************/
285 static block_t *PacketizeAVC1( decoder_t *p_dec, block_t **pp_block )
286 {
287     decoder_sys_t *p_sys = p_dec->p_sys;
288     block_t       *p_block;
289     block_t       *p_ret = NULL;
290     uint8_t       *p;
291
292     if( !pp_block || !*pp_block ) return NULL;
293
294     p_block = *pp_block;
295     *pp_block = NULL;
296
297     for( p = p_block->p_buffer; p < &p_block->p_buffer[p_block->i_buffer]; )
298     {
299         block_t *p_pic;
300         int i_size = 0;
301         int i;
302
303         for( i = 0; i < p_sys->i_avcC_length_size; i++ )
304         {
305             i_size = (i_size << 8) | (*p++);
306         }
307
308         if( i_size > 0 )
309         {
310             block_t *p_part = nal_get_annexeb( p_dec, p, i_size );
311
312             p_part->i_dts = p_block->i_dts;
313             p_part->i_pts = p_block->i_pts;
314             /* Parse the NAL */
315             if( ( p_pic = ParseNALBlock( p_dec, p_part ) ) )
316             {
317                 block_ChainAppend( &p_ret, p_pic );
318             }
319         }
320         p += i_size;
321     }
322
323     return p_ret;
324 }
325
326 static block_t *nal_get_annexeb( decoder_t *p_dec, uint8_t *p, int i_size )
327 {
328     block_t *p_nal;
329
330     p_nal = block_New( p_dec, 4 + i_size );
331
332     /* Add start code */
333     p_nal->p_buffer[0] = 0x00;
334     p_nal->p_buffer[1] = 0x00;
335     p_nal->p_buffer[2] = 0x00;
336     p_nal->p_buffer[3] = 0x01;
337     /* Copy nalu */
338     memcpy( &p_nal->p_buffer[4], p, i_size );
339
340     return p_nal;
341 }
342
/*****************************************************************************
 * nal_get_decoded: strip emulation prevention bytes from a NAL payload
 *****************************************************************************
 * Copies i_src bytes from src into a freshly malloc()ed buffer, replacing
 * every 00 00 03 sequence by 00 00 (including one that ends the input).
 *
 * pp_ret receives the buffer, which the caller must free(); pi_ret receives
 * the number of bytes written. If src is NULL, i_src is not positive, or the
 * allocation fails, *pp_ret is NULL and *pi_ret is 0.
 *****************************************************************************/
static void nal_get_decoded( uint8_t **pp_ret, int *pi_ret, uint8_t *src, int i_src )
{
    uint8_t *end;
    uint8_t *dst;

    *pp_ret = NULL;
    *pi_ret = 0;

    if( src == NULL || i_src <= 0 )
    {
        return;
    }

    /* The output is never longer than the input */
    dst = malloc( i_src );
    if( dst == NULL )
    {
        return;
    }
    *pp_ret = dst;

    end = src + i_src;
    while( src < end )
    {
        /* Compare the remaining length rather than computing end - 3, which
         * would point before the buffer for inputs shorter than 3 bytes. */
        if( end - src >= 3 &&
            src[0] == 0x00 && src[1] == 0x00 && src[2] == 0x03 )
        {
            *dst++ = 0x00;
            *dst++ = 0x00;

            src += 3;
            continue;
        }
        *dst++ = *src++;
    }

    *pi_ret = (int)( dst - *pp_ret );
}
365
366 static inline int bs_read_ue( bs_t *s )
367 {
368     int i = 0;
369
370     while( bs_read1( s ) == 0 && s->p < s->p_end && i < 32 )
371     {
372         i++;
373     }
374     return( ( 1 << i) - 1 + bs_read( s, i ) );
375 }
376 static inline int bs_read_se( bs_t *s )
377 {
378     int val = bs_read_ue( s );
379
380     return val&0x01 ? (val+1)/2 : -(val/2);
381 }
382
383
384 static block_t *ParseNALBlock( decoder_t *p_dec, block_t *p_frag )
385 {
386     decoder_sys_t *p_sys = p_dec->p_sys;
387     block_t *p_pic = NULL;
388
389     const int i_ref_idc = (p_frag->p_buffer[4] >> 5)&0x03;
390     const int i_nal_type= p_frag->p_buffer[4]&0x1f;
391
392     if( p_sys->b_slice &&
393         ( i_nal_type == NAL_SLICE || i_nal_type == NAL_SLICE_IDR ||
394           i_nal_type == NAL_SLICE_DPC || i_nal_type == NAL_SPS || i_nal_type == NAL_PPS ) )
395     {
396         if( p_sys->b_sps )
397         {
398             p_pic = block_ChainGather( p_sys->p_frame );
399             p_pic->i_dts = p_sys->i_dts;
400             p_pic->i_pts = p_sys->i_pts;
401             p_pic->i_length = 0;    /* FIXME */
402             p_pic->i_flags = p_sys->i_flags;
403         }
404         else
405         {
406             block_ChainRelease( p_sys->p_frame );
407             msg_Warn( p_dec, "waiting SPS" );
408         }
409
410         /* reset context */
411         p_sys->p_frame = NULL;
412         p_sys->b_slice = VLC_FALSE;
413         //p_sys->i_dts += 40000;
414     }
415
416     if( i_nal_type >= NAL_SLICE && i_nal_type <= NAL_SLICE_IDR )
417     {
418         uint8_t *dec;
419         int     i_dec;
420         bs_t s;
421
422         p_sys->b_slice = VLC_TRUE;
423         p_sys->i_dts   = p_frag->i_dts;
424         p_sys->i_pts   = p_frag->i_pts;
425
426         /* do not convert the whole frame */
427         nal_get_decoded( &dec, &i_dec, &p_frag->p_buffer[5], __MIN( p_frag->i_buffer - 5, 60 ) );
428         bs_init( &s, dec, i_dec );
429
430         /* i_first_mb */
431         bs_read_ue( &s );
432         /* picture type */
433         switch( bs_read_ue( &s ) )
434         {
435             case 0: case 5:
436                 p_sys->i_flags = BLOCK_FLAG_TYPE_P;
437                 break;
438             case 1: case 6:
439                 p_sys->i_flags =BLOCK_FLAG_TYPE_B;
440                 break;
441             case 2: case 7:
442                 p_sys->i_flags = BLOCK_FLAG_TYPE_I;
443                 break;
444             case 3: case 8: /* SP */
445                 p_sys->i_flags = BLOCK_FLAG_TYPE_P;
446                 break;
447             case 4: case 9:
448                 p_sys->i_flags = BLOCK_FLAG_TYPE_I;
449                 break;
450         }
451
452         free( dec );
453     }
454     else if( i_nal_type == NAL_SPS )
455     {
456         uint8_t *dec;
457         int     i_dec;
458         bs_t s;
459         int i_tmp;
460
461         p_sys->b_sps = VLC_TRUE;
462
463         nal_get_decoded( &dec, &i_dec, &p_frag->p_buffer[5], p_frag->i_buffer - 5 );
464
465         bs_init( &s, dec, i_dec );
466         /* Skip profile(8), constraint_set012, reserver(5), level(8) */
467         bs_skip( &s, 8 + 1+1+1 + 5 + 8 );
468         /* sps id */
469         bs_read_ue( &s );
470         /* Skip i_log2_max_frame_num */
471         bs_read_ue( &s );
472         /* Read poc_type */
473         i_tmp = bs_read_ue( &s );
474         if( i_tmp == 0 )
475         {
476             /* skip i_log2_max_poc_lsb */
477             bs_read_ue( &s );
478         }
479         else if( i_tmp == 1 )
480         {
481             int i_cycle;
482             /* skip b_delta_pic_order_always_zero */
483             bs_skip( &s, 1 );
484             /* skip i_offset_for_non_ref_pic */
485             bs_read_se( &s );
486             /* skip i_offset_for_top_to_bottom_field */
487             bs_read_se( &s );
488             /* read i_num_ref_frames_in_poc_cycle */
489             i_cycle = bs_read_ue( &s );
490             if( i_cycle > 256 ) i_cycle = 256;
491             while( i_cycle > 0 )
492             {
493                 /* skip i_offset_for_ref_frame */
494                 bs_read_se(&s );
495             }
496         }
497         /* i_num_ref_frames */
498         bs_read_ue( &s );
499         /* b_gaps_in_frame_num_value_allowed */
500         bs_skip( &s, 1 );
501
502         /* Read size */
503         p_dec->fmt_out.video.i_width  = 16 * ( bs_read_ue( &s ) + 1 );
504         p_dec->fmt_out.video.i_height = 16 * ( bs_read_ue( &s ) + 1 );
505
506         /* b_frame_mbs_only */
507         i_tmp = bs_read( &s, 1 );
508         if( i_tmp == 0 )
509         {
510             bs_skip( &s, 1 );
511         }
512         /* b_direct8x8_inference */
513         bs_skip( &s, 1 );
514
515         /* crop ? */
516         i_tmp = bs_read( &s, 1 );
517         if( i_tmp )
518         {
519             /* left */
520             p_dec->fmt_out.video.i_width -= 2 * bs_read_ue( &s );
521             /* right */
522             p_dec->fmt_out.video.i_width -= 2 * bs_read_ue( &s );
523             /* top */
524             p_dec->fmt_out.video.i_height -= 2 * bs_read_ue( &s );
525             /* bottom */
526             p_dec->fmt_out.video.i_height -= 2 * bs_read_ue( &s );
527         }
528
529         /* vui */
530         i_tmp = bs_read( &s, 1 );
531         if( i_tmp )
532         {
533             /* read the aspect ratio part if any FIXME check it */
534             i_tmp = bs_read( &s, 1 );
535             if( i_tmp )
536             {
537                 static const struct { int w, h; } sar[14] =
538                 {
539                     { 0,   0 }, { 1,   1 }, { 12, 11 }, { 10, 11 },
540                     { 16, 11 }, { 40, 33 }, { 24, 11 }, { 20, 11 },
541                     { 32, 11 }, { 80, 33 }, { 18, 11 }, { 15, 11 },
542                     { 64, 33 }, { 160,99 },
543                 };
544                 int i_sar = bs_read( &s, 8 );
545                 int w, h;
546
547                 if( i_sar < 14 )
548                 {
549                     w = sar[i_sar].w;
550                     h = sar[i_sar].h;
551                 }
552                 else
553                 {
554                     w = bs_read( &s, 16 );
555                     h = bs_read( &s, 16 );
556                 }
557                 p_dec->fmt_out.video.i_aspect =
558                     VOUT_ASPECT_FACTOR *
559                     w / h *
560                     p_dec->fmt_out.video.i_width / p_dec->fmt_out.video.i_height;
561             }
562         }
563
564         free( dec );
565     }
566     else if( i_nal_type == NAL_PPS )
567     {
568         bs_t s;
569         bs_init( &s, &p_frag->p_buffer[5], p_frag->i_buffer - 5 );
570
571         /* TODO */
572     }
573
574
575     /* Append the block */
576     block_ChainAppend( &p_sys->p_frame, p_frag );
577
578     return p_pic;
579 }
580