1 /*****************************************************************************
2 * h264.c: h264/avc video packetizer
3 *****************************************************************************
4 * Copyright (C) 2001, 2002, 2006 the VideoLAN team
7 * Authors: Laurent Aimar <fenrir@via.ecp.fr>
8 * Eric Petit <titer@videolan.org>
9 * Gildas Bazin <gbazin@videolan.org>
11 * This program is free software; you can redistribute it and/or modify
12 * it under the terms of the GNU General Public License as published by
13 * the Free Software Foundation; either version 2 of the License, or
14 * (at your option) any later version.
16 * This program is distributed in the hope that it will be useful,
17 * but WITHOUT ANY WARRANTY; without even the implied warranty of
18 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
19 * GNU General Public License for more details.
21 * You should have received a copy of the GNU General Public License
22 * along with this program; if not, write to the Free Software
23 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston MA 02110-1301, USA.
24 *****************************************************************************/
26 /*****************************************************************************
28 *****************************************************************************/
29 #include <stdlib.h> /* malloc(), free() */
32 #include <vlc/decoder.h>
35 #include "vlc_block_helper.h"
38 /*****************************************************************************
40 *****************************************************************************/
/* Module entry points; both are registered through set_callbacks() below. */
41 static int Open ( vlc_object_t * );
42 static void Close( vlc_object_t * );
/* Module descriptor: files the module under the stream-output packetizer
 * subcategory, labels it "H.264 video packetizer" and declares the
 * "packetizer" capability with the value 50.
 * NOTE(review): the lines that open and close the descriptor are not visible
 * in this listing. */
45 set_category( CAT_SOUT );
46 set_subcategory( SUBCAT_SOUT_PACKETIZER );
47 set_description( _("H.264 video packetizer") );
48 set_capability( "packetizer", 50 );
49 set_callbacks( Open, Close );
53 /****************************************************************************
55 ****************************************************************************/
/* The two packetize callbacks. Open() installs exactly one of them in
 * p_dec->pf_packetize: PacketizeAVC1 for 'avc1' input, Packetize otherwise. */
56 static block_t *Packetize( decoder_t *, block_t ** );
57 static block_t *PacketizeAVC1( decoder_t *, block_t ** );
/* Fields of the packetizer state reached through p_dec->p_sys.
 * NOTE(review): the enclosing declaration and most of its members are not
 * visible in this listing. */
/* Accumulates pushed input blocks; Packetize() searches it for start codes. */
61 block_bytestream_t bytestream;
/* Size in bytes (1..4) of the length prefix in front of each NAL in avc1
 * input; computed in Open(), consumed by PacketizeAVC1(). */
74 int i_avcC_length_size;
78 /* Useful values of the Sequence Parameter Set */
/* Stored by the SPS parser; the slice parser reads frame_num with
 * (i_log2_max_frame_num + 4) bits. */
79 int i_log2_max_frame_num;
82 /* Useful values of the Slice Header */
/* NAL unit type codes, compared against the low 5 bits of the NAL header
 * byte in ParseNALBlock(). Only part of the enumeration is visible here. */
103 NAL_SLICE_IDR = 5, /* ref_idc != 0 */
104 NAL_SEI = 6, /* ref_idc == 0 */
108 /* ref_idc == 0 for 6,9,10,11,12 */
/* Named values 0..3; presumably the meaning of the 2-bit nal_ref_idc field
 * (TODO confirm, the enclosing enum header is not visible). */
113 NAL_PRIORITY_DISPOSABLE = 0,
114 NAL_PRIORITY_LOW = 1,
115 NAL_PRIORITY_HIGH = 2,
116 NAL_PRIORITY_HIGHEST = 3,
/* Helpers shared by both packetize paths: ParseNALBlock() consumes one
 * start-code-prefixed NAL, nal_get_annexeb() builds such a block from a raw
 * NAL payload. */
119 static block_t *ParseNALBlock( decoder_t *, block_t * );
121 static block_t *nal_get_annexeb( decoder_t *, uint8_t *p, int );
123 /*****************************************************************************
124 * Open: probe the packetizer and return score
125 * When opening after demux, the packetizer is only loaded AFTER the decoder
126 * That means that what you set in fmt_out is ignored by the decoder in this special case
127 *****************************************************************************/
/* p_this is used as the decoder_t being probed. On acceptance the visible
 * lines allocate and initialise p_dec->p_sys, copy fmt_in to fmt_out with the
 * codec forced to 'h264', and install either PacketizeAVC1 (avc1 input) or
 * Packetize (every other accepted codec) as p_dec->pf_packetize.
 * NOTE(review): the return statements are not visible in this listing. */
128 static int Open( vlc_object_t *p_this )
130 decoder_t *p_dec = (decoder_t*)p_this;
131 decoder_sys_t *p_sys;
/* Accepted inputs: h264 / H264 / VSSH / vssh unconditionally, and avc1 only
 * when at least 7 bytes of extradata are present. The rejection path itself
 * is not visible in this listing. */
133 if( p_dec->fmt_in.i_codec != VLC_FOURCC( 'h', '2', '6', '4') &&
134 p_dec->fmt_in.i_codec != VLC_FOURCC( 'H', '2', '6', '4') &&
135 p_dec->fmt_in.i_codec != VLC_FOURCC( 'V', 'S', 'S', 'H') &&
136 p_dec->fmt_in.i_codec != VLC_FOURCC( 'v', 's', 's', 'h') &&
137 ( p_dec->fmt_in.i_codec != VLC_FOURCC( 'a', 'v', 'c', '1') ||
138 p_dec->fmt_in.i_extra < 7 ) )
143 /* Allocate the memory needed to store the decoder's structure */
/* NOTE(review): malloc() does not zero the structure; any field not assigned
 * below (e.g. p_sps / p_pps, which Close() tests against NULL) has to be
 * initialised on lines not visible here - confirm. */
144 if( ( p_dec->p_sys = p_sys = malloc( sizeof(decoder_sys_t) ) ) == NULL )
146 msg_Err( p_dec, "out of memory" );
149 p_sys->i_state = STATE_NOSYNC;
/* 4-byte start code 00 00 00 01. Packetize() searches for its last three
 * bytes only (startcode+1, length 3). */
151 p_sys->startcode[0] = 0;
152 p_sys->startcode[1] = 0;
153 p_sys->startcode[2] = 0;
154 p_sys->startcode[3] = 1;
155 p_sys->bytestream = block_BytestreamInit( p_dec );
/* No slice gathered, no pending frame, no parameter sets seen yet. */
156 p_sys->b_slice = VLC_FALSE;
157 p_sys->p_frame = NULL;
158 p_sys->b_sps = VLC_FALSE;
159 p_sys->b_pps = VLC_FALSE;
/* Slice-tracking state. ParseNALBlock() compares each new slice against
 * these values to detect the start of a new picture. */
163 p_sys->i_nal_type = -1;
164 p_sys->i_nal_ref_idc = -1;
165 p_sys->i_idr_pic_id = -1;
166 p_sys->i_frame_num = -1;
167 p_sys->i_frame_type = 0;
169 /* Setup properties */
170 es_format_Copy( &p_dec->fmt_out, &p_dec->fmt_in );
171 p_dec->fmt_out.i_codec = VLC_FOURCC( 'h', '2', '6', '4' );
173 if( p_dec->fmt_in.i_codec == VLC_FOURCC( 'a', 'v', 'c', '1' ) )
175 /* This type of stream is produced by mp4 and matroska
176 * when we want to store it in another streamformat, you need to convert
177 * The fmt_in.p_extra should ALWAYS contain the avcC
178 * The fmt_out.p_extra should contain all the SPS and PPS with 4 byte startcodes */
/* Parsing starts at byte 4 of the extradata. */
179 uint8_t *p = &((uint8_t*)p_dec->fmt_in.p_extra)[4];
/* Low two bits of that byte, plus one: size of the per-NAL length prefix
 * (1..4 bytes). */
184 p_sys->i_avcC_length_size = 1 + ((*p++)&0x03);
/* NOTE(review): i_sps / i_pps and the pointer advance between entries are
 * computed on lines not visible in this listing. */
/* Each SPS entry is a length read with GetWBE() followed, 2 bytes later, by
 * the NAL payload (so presumably a 16-bit big-endian length - TODO confirm).
 * The payload is wrapped with a 4-byte start code and handed to
 * ParseNALBlock().
 * NOTE(review): no visible check that i_length stays inside fmt_in.i_extra.
 * NOTE(review): ParseNALBlock() releases the current p_sys->p_sps and stores
 * the block it is given, so the duplicate made here appears to be freed
 * immediately - confirm whether the block_Duplicate() is needed. */
188 for( i = 0; i < i_sps; i++ )
190 int i_length = GetWBE( p );
191 block_t *p_sps = nal_get_annexeb( p_dec, p + 2, i_length );
193 p_sys->p_sps = block_Duplicate( p_sps );
194 p_sps->i_pts = p_sps->i_dts = mdate();
195 ParseNALBlock( p_dec, p_sps );
/* Same treatment for every PPS entry; the review notes above apply with
 * p_sys->p_pps in place of p_sys->p_sps. */
200 for( i = 0; i < i_pps; i++ )
202 int i_length = GetWBE( p );
203 block_t *p_pps = nal_get_annexeb( p_dec, p + 2, i_length );
205 p_sys->p_pps = block_Duplicate( p_pps );
206 p_pps->i_pts = p_pps->i_dts = mdate();
207 ParseNALBlock( p_dec, p_pps );
210 msg_Dbg( p_dec, "avcC length size=%d, sps=%d, pps=%d",
211 p_sys->i_avcC_length_size, i_sps, i_pps );
213 /* FIXME: FFMPEG isn't happy at all if you leave this */
/* Drop the extradata that es_format_Copy() put in fmt_out. */
214 if( p_dec->fmt_out.i_extra ) free( p_dec->fmt_out.p_extra );
215 p_dec->fmt_out.i_extra = 0; p_dec->fmt_out.p_extra = NULL;
217 /* Set the new extradata */
/* New extradata = stored SPS block immediately followed by stored PPS block.
 * NOTE(review): p_sys->p_sps and p_sys->p_pps are dereferenced without a
 * visible NULL check, and the malloc() result is passed straight to memcpy()
 * on the next line without being tested. */
218 p_dec->fmt_out.i_extra = p_sys->p_pps->i_buffer + p_sys->p_sps->i_buffer;
219 p_dec->fmt_out.p_extra = (uint8_t*)malloc( p_dec->fmt_out.i_extra );
220 memcpy( p_dec->fmt_out.p_extra, p_sys->p_sps->p_buffer, p_sys->p_sps->i_buffer);
221 memcpy( p_dec->fmt_out.p_extra+p_sys->p_sps->i_buffer, p_sys->p_pps->p_buffer, p_sys->p_pps->i_buffer);
224 p_dec->pf_packetize = PacketizeAVC1;
228 /* This type of stream contains data with 3 or 4 byte startcodes
229 * The fmt_in.p_extra MAY contain SPS/PPS with 4 byte startcodes
230 * The fmt_out.p_extra should be the same */
233 p_dec->pf_packetize = Packetize;
/* Run any extradata through Packetize() once so that SPS/PPS contained in it
 * are parsed and stored before the first real block arrives. */
236 if( p_dec->fmt_in.i_extra > 0 )
238 block_t *p_init = block_New( p_dec, p_dec->fmt_in.i_extra );
241 memcpy( p_init->p_buffer, p_dec->fmt_in.p_extra,
242 p_dec->fmt_in.i_extra );
244 while( ( p_pic = Packetize( p_dec, &p_init ) ) )
246 /* Should not occur because we should only receive SPS/PPS */
247 block_Release( p_pic );
255 /*****************************************************************************
256 * Close: clean up the packetizer
257 *****************************************************************************/
/* Releases what the packetizer state still holds: the chain of NALs gathered
 * for the current frame, the stored SPS and PPS blocks, and the input
 * bytestream.
 * NOTE(review): freeing p_sys itself is not visible in this listing. */
258 static void Close( vlc_object_t *p_this )
260 decoder_t *p_dec = (decoder_t*)p_this;
261 decoder_sys_t *p_sys = p_dec->p_sys;
/* p_frame is a chain of blocks, hence the chain release. */
263 if( p_sys->p_frame ) block_ChainRelease( p_sys->p_frame );
264 if( p_sys->p_sps ) block_Release( p_sys->p_sps );
265 if( p_sys->p_pps ) block_Release( p_sys->p_pps );
266 block_BytestreamRelease( &p_sys->bytestream );
270 /****************************************************************************
271 * Packetize: the whole thing
272 * Search for the startcodes 3 or more bytes
273 * Feed ParseNALBlock ALWAYS with 4 byte startcode prepended NALs
274 ****************************************************************************/
/* pp_block: in/out pointer to the input block. The block is pushed onto
 * p_sys->bytestream, which is then cut at 00 00 01 start codes; every NAL
 * found is handed to ParseNALBlock().
 * NOTE(review): the loop construct, several case labels and all return
 * statements of this function are not visible in this listing. */
275 static block_t *Packetize( decoder_t *p_dec, block_t **pp_block )
277 decoder_sys_t *p_sys = p_dec->p_sys;
/* Nothing to do without an input block. */
280 if( !pp_block || !*pp_block ) return NULL;
282 block_BytestreamPush( &p_sys->bytestream, *pp_block );
286 switch( p_sys->i_state )
/* Presumably the STATE_NOSYNC case (its label is not visible): locate the
 * first start code and drop everything in front of it. */
289 /* Skip until 3 byte startcode 0 0 1 */
290 if( block_FindStartcodeFromOffset( &p_sys->bytestream,
291 &p_sys->i_offset, p_sys->startcode+1, 3 ) == VLC_SUCCESS)
293 p_sys->i_state = STATE_NEXT_SYNC;
/* Discard the i_offset bytes that precede the start code (or all bytes
 * scanned so far when none was found). */
296 if( p_sys->i_offset )
299 block_SkipBytes( &p_sys->bytestream, p_sys->i_offset );
301 block_BytestreamFlush( &p_sys->bytestream );
/* Still unsynchronised: the handling of this case is on lines not visible
 * here. */
304 if( p_sys->i_state != STATE_NEXT_SYNC )
/* Start the next search one byte in, so the start code at offset 0 is not
 * matched again. */
310 p_sys->i_offset = 1; /* To find next startcode */
312 case STATE_NEXT_SYNC:
313 /* Find the next 3 byte startcode 0 0 1*/
314 if( block_FindStartcodeFromOffset( &p_sys->bytestream,
315 &p_sys->i_offset, p_sys->startcode+1, 3 ) != VLC_SUCCESS)
321 /* Get the new fragment and set the pts/dts */
/* One byte more than the NAL span: room for the extra leading zero that
 * turns the 3-byte start code into a 4-byte one.
 * NOTE(review): the block_New() result is dereferenced on the next line
 * without a NULL check. */
322 p_pic = block_New( p_dec, p_sys->i_offset +1 );
323 p_pic->i_pts = p_sys->bytestream.p_block->i_pts;
324 p_pic->i_dts = p_sys->bytestream.p_block->i_dts;
325 /* Force 4 byte startcode 0 0 0 1 */
326 p_pic->p_buffer[0] = 0;
/* The stream bytes (start code + NAL) are copied in behind that zero. */
328 block_GetBytes( &p_sys->bytestream, &p_pic->p_buffer[1],
331 /* Remove trailing 0 bytes */
332 while( p_pic->i_buffer && (!p_pic->p_buffer[p_pic->i_buffer-1] ) ) p_pic->i_buffer--;
/* ParseNALBlock() takes the fragment; it yields a block only when a complete
 * picture is ready. With no picture yet, go back to searching. */
336 if( !( p_pic = ParseNALBlock( p_dec, p_pic ) ) )
338 p_sys->i_state = STATE_NOSYNC;
342 msg_Dbg( p_dec, "pts="I64Fd" dts="I64Fd,
343 p_pic->i_pts, p_pic->i_dts );
346 /* So p_block doesn't get re-added several times */
347 *pp_block = block_BytestreamPop( &p_sys->bytestream );
349 p_sys->i_state = STATE_NOSYNC;
356 /****************************************************************************
357 * PacketizeAVC1: Takes VCL blocks of data and creates Annex B type NAL stream
358 * Will always use 4 byte 0 0 0 1 startcodes
359 * Will prepend a SPS and PPS before each keyframe
360 ****************************************************************************/
/* pp_block: pointer to an input block made of length-prefixed NALs. Each NAL
 * is re-wrapped with a start code, stamped with the input block's dts/pts and
 * passed to ParseNALBlock(); the pictures that come back are chained into
 * p_ret. The input block is released once it has been walked.
 * NOTE(review): the return statement is not visible in this listing. */
361 static block_t *PacketizeAVC1( decoder_t *p_dec, block_t **pp_block )
363 decoder_sys_t *p_sys = p_dec->p_sys;
365 block_t *p_ret = NULL;
368 if( !pp_block || !*pp_block ) return NULL;
/* Walk the buffer NAL by NAL until its end is reached. */
373 for( p = p_block->p_buffer; p < &p_block->p_buffer[p_block->i_buffer]; )
/* Big-endian length prefix of i_avcC_length_size bytes. */
379 for( i = 0; i < p_sys->i_avcC_length_size; i++ )
381 i_size = (i_size << 8) | (*p++);
/* NOTE(review): any check that i_size is positive and fits in the remaining
 * buffer would be on lines not visible here - confirm before trusting
 * i_size in the copy below. */
386 block_t *p_part = nal_get_annexeb( p_dec, p, i_size );
388 p_part->i_dts = p_block->i_dts;
389 p_part->i_pts = p_block->i_pts;
/* A non-NULL result is a completed picture; collect it. */
392 if( ( p_pic = ParseNALBlock( p_dec, p_part ) ) )
394 block_ChainAppend( &p_ret, p_pic );
399 block_Release( p_block );
/* nal_get_annexeb: build a new block holding the 4-byte start code
 * 00 00 00 01 followed by a copy of the i_size bytes at p.
 * The new block is allocated with block_New( p_dec, 4 + i_size ).
 * NOTE(review): the allocation check and the return statement are not
 * visible in this listing; callers use the result as a block_t pointer. */
404 static block_t *nal_get_annexeb( decoder_t *p_dec, uint8_t *p, int i_size )
408 p_nal = block_New( p_dec, 4 + i_size );
/* Start code */
411 p_nal->p_buffer[0] = 0x00;
412 p_nal->p_buffer[1] = 0x00;
413 p_nal->p_buffer[2] = 0x00;
414 p_nal->p_buffer[3] = 0x01;
/* NAL payload right behind the start code */
417 memcpy( &p_nal->p_buffer[4], p, i_size );
/* nal_get_decoded: copy i_src bytes starting at src into a freshly
 * malloc()ed buffer, giving special treatment to sequences that begin with
 * two zero bytes. The buffer is returned through *pp_ret and the number of
 * bytes written through *pi_ret.
 * NOTE(review): presumably this drops the 0x03 escape byte that follows
 * 00 00 inside a NAL - the rest of the condition and the copy loop are not
 * visible in this listing, TODO confirm. The malloc() check, if any, is not
 * visible either. Freeing *pp_ret is left to the caller; confirm call sites
 * do so. */
422 static void nal_get_decoded( uint8_t **pp_ret, int *pi_ret,
423 uint8_t *src, int i_src )
425 uint8_t *end = &src[i_src];
/* The output buffer is sized like the input (i_src bytes). */
426 uint8_t *dst = malloc( i_src );
/* Only test for the pattern when more than 3 input bytes remain. */
432 if( src < end - 3 && src[0] == 0x00 && src[1] == 0x00 &&
/* Output length = distance the write pointer moved from the buffer start. */
444 *pi_ret = dst - *pp_ret;
/* bs_read_ue: read one variable-length unsigned code from the bit reader s.
 * Zero bits are consumed until a one bit is read, the end of the data is
 * reached, or i reaches 32; the result is (2^i - 1) plus the value of the
 * next i bits.
 * NOTE(review): the declaration and update of i are not visible in this
 * listing; presumably i counts the zero bits consumed. If it can reach 32,
 * the shift in the return expression exceeds the width of a 32-bit int -
 * confirm. */
447 static inline int bs_read_ue( bs_t *s )
451 while( bs_read1( s ) == 0 && s->p < s->p_end && i < 32 )
455 return( ( 1 << i) - 1 + bs_read( s, i ) );
/* bs_read_se: read one variable-length signed code from the bit reader s.
 * The value is read with bs_read_ue() and then mapped to a signed result:
 * odd values become positive, even values become zero or negative
 * (0 -> 0, 1 -> 1, 2 -> -1, 3 -> 2, 4 -> -2, ...). */
458 static inline int bs_read_se( bs_t *s )
460 int val = bs_read_ue( s );
462 return val&0x01 ? (val+1)/2 : -(val/2);
466 /*****************************************************************************
467 * ParseNALBlock: parses annexB type NALs
468 * All p_frag blocks are required to start with 0 0 0 1 4-byte startcode
469 *****************************************************************************/
/* p_frag: one NAL preceded by a 4-byte start code, so the NAL header byte is
 * p_buffer[4] and the payload starts at p_buffer[5].
 * NALs are gathered in p_sys->p_frame until a picture boundary is detected;
 * at that point the gathered chain is turned into the output block p_pic.
 * SPS and PPS NALs are parsed, stored in p_sys->p_sps / p_sys->p_pps and not
 * appended to the frame.
 * NOTE(review): the return statement is not visible in this listing; callers
 * treat the result as NULL when no picture is ready. */
470 static block_t *ParseNALBlock( decoder_t *p_dec, block_t *p_frag )
472 decoder_sys_t *p_sys = p_dec->p_sys;
473 block_t *p_pic = NULL;
/* NAL header byte: bits 5-6 give ref_idc, bits 0-4 give the NAL type. */
475 const int i_nal_ref_idc = (p_frag->p_buffer[4] >> 5)&0x03;
476 const int i_nal_type = p_frag->p_buffer[4]&0x1f;
/* The backslash-continued lines below are presumably the body of the OUTPUT
 * macro used further down (its define line is not visible in this listing).
 * They gather p_sys->p_frame into p_pic, tag it with the current frame type,
 * reset the gathering state and, for I pictures with both parameter sets
 * stored, put copies of the SPS and PPS in front of the picture. */
480 p_pic = block_ChainGather( p_sys->p_frame ); \
481 p_pic->i_length = 0; /* FIXME */ \
482 p_pic->i_flags |= p_sys->i_frame_type; \
484 p_sys->i_frame_type = 0; \
485 p_sys->p_frame = NULL; \
486 p_sys->b_slice = VLC_FALSE; \
488 if( ( p_pic->i_flags & BLOCK_FLAG_TYPE_I ) && \
489 p_sys->p_sps && p_sys->p_pps ) \
491 block_t *p_sps = block_Duplicate( p_sys->p_sps ); \
492 block_t *p_pps = block_Duplicate( p_sys->p_pps ); \
493 p_sps->i_dts = p_pps->i_dts = p_pic->i_dts; \
494 p_sps->i_pts = p_pps->i_pts = p_pic->i_pts; \
495 block_ChainAppend( &p_sps, p_pps ); \
496 block_ChainAppend( &p_sps, p_pic ); \
497 p_pic = block_ChainGather( p_sps ); \
502 if( p_sys->b_slice && !p_sys->b_sps )
/* Slices were gathered before any SPS was seen: drop them. */
504 block_ChainRelease( p_sys->p_frame );
505 msg_Warn( p_dec, "waiting for SPS" );
508 p_sys->p_frame = NULL;
509 p_sys->b_slice = VLC_FALSE;
/* Slice NAL (types NAL_SLICE..NAL_SLICE_IDR) combined with a condition whose
 * first half is on a line not visible here: only flag that a slice was seen. */
513 i_nal_type >= NAL_SLICE && i_nal_type <= NAL_SLICE_IDR )
515 p_sys->b_slice = VLC_TRUE;
516 /* Fragment will be discarded later on */
/* Regular slice: parse the start of the slice header to find the frame type
 * and to decide whether this slice opens a new picture. */
518 else if( i_nal_type >= NAL_SLICE && i_nal_type <= NAL_SLICE_IDR )
521 int i_dec, i_first_mb, i_slice_type, i_frame_num;
522 vlc_bool_t b_pic = VLC_FALSE;
525 /* do not convert the whole frame */
/* At most the first 60 payload bytes are decoded for header parsing. */
526 nal_get_decoded( &dec, &i_dec, &p_frag->p_buffer[5],
527 __MIN( p_frag->i_buffer - 5, 60 ) );
528 bs_init( &s, dec, i_dec );
530 /* first_mb_in_slice */
531 i_first_mb = bs_read_ue( &s );
/* slice_type selects the BLOCK_FLAG_TYPE_* stored in i_frame_type. Most case
 * labels are not visible in this listing. */
534 switch( (i_slice_type = bs_read_ue( &s )) )
537 p_sys->i_frame_type = BLOCK_FLAG_TYPE_P;
540 p_sys->i_frame_type = BLOCK_FLAG_TYPE_B;
543 p_sys->i_frame_type = BLOCK_FLAG_TYPE_I;
545 case 3: case 8: /* SP */
546 p_sys->i_frame_type = BLOCK_FLAG_TYPE_P;
549 p_sys->i_frame_type = BLOCK_FLAG_TYPE_I;
553 /* pic_parameter_set_id */
/* frame_num is a fixed-width field of (i_log2_max_frame_num + 4) bits. */
556 i_frame_num = bs_read( &s, p_sys->i_log2_max_frame_num + 4 );
/* NOTE(review): the comment opened on the next line has no visible closing
 * line; in this listing it only ends at the 'bottom_field_flag' comment.
 * The lines in between are left exactly as found. */
558 /* Detection of the first VCL NAL unit of a primary coded picture
560 if( i_frame_num != p_sys->i_frame_num ||
561 ( (i_nal_ref_idc != p_sys->i_nal_ref_idc) &&
562 (!i_nal_ref_idc || !p_sys->i_nal_ref_idc) ) )
566 p_sys->i_frame_num = i_frame_num;
567 p_sys->i_nal_ref_idc = i_nal_ref_idc;
569 if( !p_sys->b_frame_mbs_only )
572 if( bs_read( &s, 1 ) )
574 /* bottom_field_flag */
/* IDR slices: a change of NAL type or of idr_pic_id also starts a new
 * picture. */
579 if( i_nal_type == NAL_SLICE_IDR )
582 int i_idr_pic_id = bs_read_ue( &s );
583 if( p_sys->i_nal_type != i_nal_type ) b_pic = VLC_TRUE;
584 if( p_sys->i_idr_pic_id != i_idr_pic_id ) b_pic = VLC_TRUE;
585 p_sys->i_idr_pic_id = i_idr_pic_id;
587 p_sys->i_nal_type = i_nal_type;
/* New picture detected while slices of the previous one are pending: emit
 * the previous picture first. */
589 if( b_pic && p_sys->b_slice ) OUTPUT;
591 p_sys->b_slice = VLC_TRUE;
/* Sequence parameter set: extract log2_max_frame_num, frame_mbs_only, the
 * picture size and, when present, the aspect ratio. */
595 else if( i_nal_type == NAL_SPS )
602 if( !p_sys->b_sps ) msg_Dbg( p_dec, "found NAL_SPS" );
604 p_sys->b_sps = VLC_TRUE;
/* Unlike slices, the whole SPS payload is decoded. */
606 nal_get_decoded( &dec, &i_dec, &p_frag->p_buffer[5],
607 p_frag->i_buffer - 5 );
609 bs_init( &s, dec, i_dec );
610 /* Skip profile(8), constraint_set012, reserved(5), level(8) */
611 bs_skip( &s, 8 + 1+1+1 + 5 + 8 );
614 /* Store i_log2_max_frame_num (the slice parser adds 4 when reading frame_num) */
615 p_sys->i_log2_max_frame_num = bs_read_ue( &s );
/* i_tmp selects which group of fields follows; they are skipped on lines
 * that are only partly visible here. */
617 i_tmp = bs_read_ue( &s );
620 /* skip i_log2_max_poc_lsb */
623 else if( i_tmp == 1 )
626 /* skip b_delta_pic_order_always_zero */
628 /* skip i_offset_for_non_ref_pic */
630 /* skip i_offset_for_top_to_bottom_field */
632 /* read i_num_ref_frames_in_poc_cycle */
633 i_cycle = bs_read_ue( &s );
/* Clamp so a corrupt value cannot drive the skip loop for too long. */
634 if( i_cycle > 256 ) i_cycle = 256;
637 /* skip i_offset_for_ref_frame */
641 /* i_num_ref_frames */
643 /* b_gaps_in_frame_num_value_allowed */
/* Width and height are each 16 * (coded value + 1).
 * NOTE(review): no further adjustment of these sizes is made in the visible
 * lines - confirm whether one is expected. */
647 p_dec->fmt_out.video.i_width = 16 * ( bs_read_ue( &s ) + 1 );
648 p_dec->fmt_out.video.i_height = 16 * ( bs_read_ue( &s ) + 1 );
650 /* b_frame_mbs_only */
651 p_sys->b_frame_mbs_only = bs_read( &s, 1 );
652 if( p_sys->b_frame_mbs_only == 0 )
656 /* b_direct8x8_inference */
660 i_tmp = bs_read( &s, 1 );
674 i_tmp = bs_read( &s, 1 );
677 /* read the aspect ratio part if any FIXME check it */
678 i_tmp = bs_read( &s, 1 );
/* Table of 14 predefined sample aspect ratios. i_sar below is an 8-bit
 * value; how it selects an entry is on lines not visible here. */
681 static const struct { int w, h; } sar[14] =
683 { 0, 0 }, { 1, 1 }, { 12, 11 }, { 10, 11 },
684 { 16, 11 }, { 40, 33 }, { 24, 11 }, { 20, 11 },
685 { 32, 11 }, { 80, 33 }, { 18, 11 }, { 15, 11 },
686 { 64, 33 }, { 160,99 },
688 int i_sar = bs_read( &s, 8 );
/* Explicit ratio: w and h are read as two 16-bit fields (the condition
 * selecting this path is not visible). */
698 w = bs_read( &s, 16 );
699 h = bs_read( &s, 16 );
/* Display aspect = sample aspect (w/h) scaled by the picture size, in
 * integer arithmetic evaluated left to right.
 * NOTE(review): h and i_height are divisors; any guard against zero would be
 * on lines not visible here - confirm. */
702 p_dec->fmt_out.video.i_aspect = VOUT_ASPECT_FACTOR * w /
703 h * p_dec->fmt_out.video.i_width /
704 p_dec->fmt_out.video.i_height;
706 p_dec->fmt_out.video.i_aspect = VOUT_ASPECT_FACTOR;
/* A parameter set ends the picture being gathered. */
712 if( p_sys->b_slice ) OUTPUT;
714 /* We have a new SPS */
/* p_frag itself becomes the stored SPS, replacing any previous one. */
715 if( p_sys->p_sps ) block_Release( p_sys->p_sps );
716 p_sys->p_sps = p_frag;
718 /* Do not append the SPS because we will insert it on keyframes */
/* Picture parameter set: handled like the SPS, without using its contents
 * in the visible lines. */
721 else if( i_nal_type == NAL_PPS )
/* The bit reader is set up directly on the payload bytes here (no
 * nal_get_decoded() call). */
724 bs_init( &s, &p_frag->p_buffer[5], p_frag->i_buffer - 5 );
726 if( !p_sys->b_pps ) msg_Dbg( p_dec, "found NAL_PPS" );
727 p_sys->b_pps = VLC_TRUE;
731 if( p_sys->b_slice ) OUTPUT;
733 /* We have a new PPS */
734 if( p_sys->p_pps ) block_Release( p_sys->p_pps );
735 p_sys->p_pps = p_frag;
737 /* Do not append the PPS because we will insert it on keyframes */
/* Access unit delimiter, SEI and NAL types 13..18 also close the picture
 * being gathered. */
740 else if( i_nal_type == NAL_AU_DELIMITER ||
741 i_nal_type == NAL_SEI ||
742 ( i_nal_type >= 13 && i_nal_type <= 18 ) )
744 if( p_sys->b_slice ) OUTPUT;
749 /* Append the block */
/* p_frag joins the chain for the picture currently being gathered. */
750 block_ChainAppend( &p_sys->p_frame, p_frag );