1 /*****************************************************************************
2 * h264.c: h264/avc video packetizer
3 *****************************************************************************
4 * Copyright (C) 2001, 2002, 2006 the VideoLAN team
7 * Authors: Laurent Aimar <fenrir@via.ecp.fr>
8 * Eric Petit <titer@videolan.org>
9 * Gildas Bazin <gbazin@videolan.org>
11 * This program is free software; you can redistribute it and/or modify
12 * it under the terms of the GNU General Public License as published by
13 * the Free Software Foundation; either version 2 of the License, or
14 * (at your option) any later version.
16 * This program is distributed in the hope that it will be useful,
17 * but WITHOUT ANY WARRANTY; without even the implied warranty of
18 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
19 * GNU General Public License for more details.
21 * You should have received a copy of the GNU General Public License
22 * along with this program; if not, write to the Free Software
23 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston MA 02110-1301, USA.
24 *****************************************************************************/
26 /*****************************************************************************
28 *****************************************************************************/
29 #include <stdlib.h> /* malloc(), free() */
32 #include <vlc/decoder.h>
35 #include "vlc_block_helper.h"
38 /*****************************************************************************
 * Module descriptor
40 *****************************************************************************/
/* Module entry points, registered below through set_callbacks(). */
41 static int Open ( vlc_object_t * );
42 static void Close( vlc_object_t * );
/* Properties of the module: category and subcategory, description string,
 * the "packetizer" capability with the value 50 (presumably its score) and
 * the Open/Close callbacks. */
45 set_category( CAT_SOUT );
46 set_subcategory( SUBCAT_SOUT_PACKETIZER );
47 set_description( _("H.264 video packetizer") );
48 set_capability( "packetizer", 50 );
49 set_callbacks( Open, Close );
53 /****************************************************************************
 * Local prototypes and private declarations
55 ****************************************************************************/
/* The two packetizing entry points; Open() installs one of them as
 * p_dec->pf_packetize depending on the input codec. */
56 static block_t *Packetize( decoder_t *, block_t ** );
57 static block_t *PacketizeAVC1( decoder_t *, block_t ** );
/* Byte stream accumulating the input blocks (accessed as p_sys->bytestream). */
61 block_bytestream_t bytestream;
/* Size in bytes of the NAL length prefix of avc1 input; Open() sets it to
 * 1 + (the low two bits of an avcC byte), i.e. a value from 1 to 4. */
74 int i_avcC_length_size;
78 /* Useful values of the Sequence Parameter Set */
79 int i_log2_max_frame_num;
82 /* Useful values of the Slice Header */
/* NAL unit types; ParseNALBlock() compares them with the low 5 bits of the
 * NAL header byte. */
103 NAL_SLICE_IDR = 5, /* ref_idc != 0 */
104 NAL_SEI = 6, /* ref_idc == 0 */
108 /* ref_idc == 0 for 6,9,10,11,12 */
/* NOTE(review): presumably the four possible values of the 2-bit nal_ref_idc
 * field - confirm against the users of these constants. */
113 NAL_PRIORITY_DISPOSABLE = 0,
114 NAL_PRIORITY_LOW = 1,
115 NAL_PRIORITY_HIGH = 2,
116 NAL_PRIORITY_HIGHEST = 3,
/* NAL parser called by both packetizers and by Open(). */
119 static block_t *ParseNALBlock( decoder_t *, block_t * );
/* Builds a block holding a 4-byte start code followed by a copy of the NAL. */
121 static block_t *nal_get_annexeb( decoder_t *, uint8_t *p, int );
123 /*****************************************************************************
124 * Open: probe the packetizer and return score
125 * When opening after demux, the packetizer is only loaded AFTER the decoder
126 * That means that what you set in fmt_out is ignored by the decoder in this special case
 *
 * Rejects inputs whose codec is not one of the fourccs tested below, allocates
 * and initialises the private state, copies fmt_in to fmt_out with the codec
 * forced to 'h264', and selects PacketizeAVC1 ('avc1' input carrying an avcC
 * in p_extra) or Packetize (start code delimited input) as pf_packetize.
127 *****************************************************************************/
128 static int Open( vlc_object_t *p_this )
130 decoder_t *p_dec = (decoder_t*)p_this;
131 decoder_sys_t *p_sys;
/* Only the fourccs below are handled; 'avc1' is additionally rejected when it
 * carries fewer than 7 bytes of extradata. */
133 if( p_dec->fmt_in.i_codec != VLC_FOURCC( 'h', '2', '6', '4') &&
134 p_dec->fmt_in.i_codec != VLC_FOURCC( 'H', '2', '6', '4') &&
135 p_dec->fmt_in.i_codec != VLC_FOURCC( 'V', 'S', 'S', 'H') &&
136 p_dec->fmt_in.i_codec != VLC_FOURCC( 'v', 's', 's', 'h') &&
137 p_dec->fmt_in.i_codec != VLC_FOURCC( 'D', 'A', 'V', 'C') &&
138 ( p_dec->fmt_in.i_codec != VLC_FOURCC( 'a', 'v', 'c', '1') ||
139 p_dec->fmt_in.i_extra < 7 ) )
144 /* Allocate the memory needed to store the decoder's structure */
145 if( ( p_dec->p_sys = p_sys = malloc( sizeof(decoder_sys_t) ) ) == NULL )
147 msg_Err( p_dec, "out of memory" );
/* Initial parser state: not synchronised, no frame in progress, no SPS or PPS
 * seen yet. */
150 p_sys->i_state = STATE_NOSYNC;
/* 4-byte start code 00 00 00 01; Packetize() searches for its last three
 * bytes (startcode+1). */
152 p_sys->startcode[0] = 0;
153 p_sys->startcode[1] = 0;
154 p_sys->startcode[2] = 0;
155 p_sys->startcode[3] = 1;
156 p_sys->bytestream = block_BytestreamInit( p_dec );
157 p_sys->b_slice = VLC_FALSE;
158 p_sys->p_frame = NULL;
159 p_sys->b_sps = VLC_FALSE;
160 p_sys->b_pps = VLC_FALSE;
/* -1 marks the values remembered from the previous slice as unknown. */
164 p_sys->i_nal_type = -1;
165 p_sys->i_nal_ref_idc = -1;
166 p_sys->i_idr_pic_id = -1;
167 p_sys->i_frame_num = -1;
168 p_sys->i_frame_type = 0;
170 /* Setup properties */
171 es_format_Copy( &p_dec->fmt_out, &p_dec->fmt_in );
172 p_dec->fmt_out.i_codec = VLC_FOURCC( 'h', '2', '6', '4' );
174 if( p_dec->fmt_in.i_codec == VLC_FOURCC( 'a', 'v', 'c', '1' ) )
176 /* This type of stream is produced by mp4 and matroska
177 * when we want to store it in another streamformat, you need to convert
178 * The fmt_in.p_extra should ALWAYS contain the avcC
179 * The fmt_out.p_extra should contain all the SPS and PPS with 4 byte startcodes */
/* Start reading at byte 4 of the avcC extradata. */
180 uint8_t *p = &((uint8_t*)p_dec->fmt_in.p_extra)[4];
/* The low two bits of this byte hold the NAL length size minus one. */
185 p_sys->i_avcC_length_size = 1 + ((*p++)&0x03);
/* Each SPS entry is a 2-byte length (presumably big-endian, read by GetWBE)
 * followed by the NAL payload.
 * NOTE(review): no check that i_length stays within fmt_in.i_extra is visible
 * here - confirm. */
189 for( i = 0; i < i_sps; i++ )
191 int i_length = GetWBE( p );
192 block_t *p_sps = nal_get_annexeb( p_dec, p + 2, i_length );
/* A copy is stored as the current SPS, then the NAL goes through the parser.
 * NOTE(review): for a SPS, ParseNALBlock() releases p_sys->p_sps and stores
 * the block it was given, so this duplicate looks short-lived - confirm. */
194 p_sys->p_sps = block_Duplicate( p_sps );
195 p_sps->i_pts = p_sps->i_dts = mdate();
196 ParseNALBlock( p_dec, p_sps );
/* Same layout and handling for the PPS entries. */
201 for( i = 0; i < i_pps; i++ )
203 int i_length = GetWBE( p );
204 block_t *p_pps = nal_get_annexeb( p_dec, p + 2, i_length );
206 p_sys->p_pps = block_Duplicate( p_pps );
207 p_pps->i_pts = p_pps->i_dts = mdate();
208 ParseNALBlock( p_dec, p_pps );
211 msg_Dbg( p_dec, "avcC length size=%d, sps=%d, pps=%d",
212 p_sys->i_avcC_length_size, i_sps, i_pps );
214 /* FIXME: FFMPEG isn't happy at all if you leave this */
215 if( p_dec->fmt_out.i_extra ) free( p_dec->fmt_out.p_extra );
216 p_dec->fmt_out.i_extra = 0; p_dec->fmt_out.p_extra = NULL;
/* The new extradata is the current SPS followed by the current PPS.
 * NOTE(review): p_sys->p_sps and p_sys->p_pps are dereferenced and the
 * malloc() result is passed to memcpy() without a check in the lines visible
 * here - confirm that at least one SPS and one PPS are guaranteed. */
218 /* Set the new extradata */
219 p_dec->fmt_out.i_extra = p_sys->p_pps->i_buffer + p_sys->p_sps->i_buffer;
220 p_dec->fmt_out.p_extra = (uint8_t*)malloc( p_dec->fmt_out.i_extra );
221 memcpy( p_dec->fmt_out.p_extra, p_sys->p_sps->p_buffer, p_sys->p_sps->i_buffer);
222 memcpy( p_dec->fmt_out.p_extra+p_sys->p_sps->i_buffer, p_sys->p_pps->p_buffer, p_sys->p_pps->i_buffer);
225 p_dec->pf_packetize = PacketizeAVC1;
229 /* This type of stream contains data with 3 or 4 byte startcodes
230 * The fmt_in.p_extra MAY contain SPS/PPS with 4 byte startcodes
231 * The fmt_out.p_extra should be the same */
234 p_dec->pf_packetize = Packetize;
/* Run any extradata through Packetize() once so that the SPS/PPS it may
 * contain are parsed; pictures coming out of it are released. */
237 if( p_dec->fmt_in.i_extra > 0 )
239 block_t *p_init = block_New( p_dec, p_dec->fmt_in.i_extra );
242 memcpy( p_init->p_buffer, p_dec->fmt_in.p_extra,
243 p_dec->fmt_in.i_extra );
245 while( ( p_pic = Packetize( p_dec, &p_init ) ) )
247 /* Should not occur because we should only receive SPS/PPS */
248 block_Release( p_pic );
256 /*****************************************************************************
257 * Close: clean up the packetizer
 * Releases the frame in progress (a block chain), the stored SPS and PPS
 * blocks when present, and the byte stream.
258 *****************************************************************************/
259 static void Close( vlc_object_t *p_this )
261 decoder_t *p_dec = (decoder_t*)p_this;
262 decoder_sys_t *p_sys = p_dec->p_sys;
/* p_frame is a chain of NAL blocks, hence the chain release. */
264 if( p_sys->p_frame ) block_ChainRelease( p_sys->p_frame );
265 if( p_sys->p_sps ) block_Release( p_sys->p_sps );
266 if( p_sys->p_pps ) block_Release( p_sys->p_pps );
267 block_BytestreamRelease( &p_sys->bytestream );
271 /****************************************************************************
272 * Packetize: the whole thing
273 * Search for the startcodes 3 or more bytes
274 * Feed ParseNALBlock ALWAYS with 4 byte startcode prepended NALs
 *
 * Returns NULL immediately when pp_block or *pp_block is NULL. Otherwise the
 * block is pushed on the byte stream and a small state machine driven by
 * p_sys->i_state cuts the stream at each 00 00 01 start code.
275 ****************************************************************************/
276 static block_t *Packetize( decoder_t *p_dec, block_t **pp_block )
278 decoder_sys_t *p_sys = p_dec->p_sys;
281 if( !pp_block || !*pp_block ) return NULL;
/* Queue the new input block on the byte stream. */
283 block_BytestreamPush( &p_sys->bytestream, *pp_block );
287 switch( p_sys->i_state )
290 /* Skip until 3 byte startcode 0 0 1 */
291 if( block_FindStartcodeFromOffset( &p_sys->bytestream,
292 &p_sys->i_offset, p_sys->startcode+1, 3 ) == VLC_SUCCESS)
294 p_sys->i_state = STATE_NEXT_SYNC;
/* Drop whatever precedes the position reached by the search. */
297 if( p_sys->i_offset )
300 block_SkipBytes( &p_sys->bytestream, p_sys->i_offset );
302 block_BytestreamFlush( &p_sys->bytestream );
305 if( p_sys->i_state != STATE_NEXT_SYNC )
311 p_sys->i_offset = 1; /* To find next startcode */
313 case STATE_NEXT_SYNC:
314 /* Find the next 3 byte startcode 0 0 1*/
315 if( block_FindStartcodeFromOffset( &p_sys->bytestream,
316 &p_sys->i_offset, p_sys->startcode+1, 3 ) != VLC_SUCCESS)
/* One extra byte is allocated in front of the fragment: it receives the
 * leading 0 that turns the 3-byte start code into a 4-byte one. */
322 /* Get the new fragment and set the pts/dts */
323 p_pic = block_New( p_dec, p_sys->i_offset +1 );
324 p_pic->i_pts = p_sys->bytestream.p_block->i_pts;
325 p_pic->i_dts = p_sys->bytestream.p_block->i_dts;
326 /* Force 4 byte startcode 0 0 0 1 */
327 p_pic->p_buffer[0] = 0;
329 block_GetBytes( &p_sys->bytestream, &p_pic->p_buffer[1],
332 /* Remove trailing 0 bytes */
333 while( p_pic->i_buffer && (!p_pic->p_buffer[p_pic->i_buffer-1] ) ) p_pic->i_buffer--;
/* Nothing was returned by the parser: go back to searching for a start
 * code. */
337 if( !( p_pic = ParseNALBlock( p_dec, p_pic ) ) )
339 p_sys->i_state = STATE_NOSYNC;
343 msg_Dbg( p_dec, "pts="I64Fd" dts="I64Fd,
344 p_pic->i_pts, p_pic->i_dts );
347 /* So p_block doesn't get re-added several times */
348 *pp_block = block_BytestreamPop( &p_sys->bytestream );
350 p_sys->i_state = STATE_NOSYNC;
357 /****************************************************************************
358 * PacketizeAVC1: Takes VCL blocks of data and creates Annex B type NAL stream
359 * Will always use 4 byte 0 0 0 1 startcodes
360 * Will prepend a SPS and PPS before each keyframe
 *
 * The input block is a sequence of NALs, each preceded by a length prefix of
 * p_sys->i_avcC_length_size bytes. Returns NULL when pp_block or *pp_block is
 * NULL; otherwise the pictures returned by ParseNALBlock() are chained into
 * p_ret and the input block is released.
361 ****************************************************************************/
362 static block_t *PacketizeAVC1( decoder_t *p_dec, block_t **pp_block )
364 decoder_sys_t *p_sys = p_dec->p_sys;
366 block_t *p_ret = NULL;
369 if( !pp_block || !*pp_block ) return NULL;
/* Walk the buffer one length-prefixed NAL at a time. */
374 for( p = p_block->p_buffer; p < &p_block->p_buffer[p_block->i_buffer]; )
/* Read the length prefix, most significant byte first. */
380 for( i = 0; i < p_sys->i_avcC_length_size; i++ )
382 i_size = (i_size << 8) | (*p++);
/* NOTE(review): no check that i_size fits in the remaining bytes of the
 * block is visible here - confirm. */
387 block_t *p_part = nal_get_annexeb( p_dec, p, i_size );
/* Every NAL inherits the timestamps of the input block. */
389 p_part->i_dts = p_block->i_dts;
390 p_part->i_pts = p_block->i_pts;
393 if( ( p_pic = ParseNALBlock( p_dec, p_part ) ) )
395 block_ChainAppend( &p_ret, p_pic );
400 block_Release( p_block );
405 static block_t *nal_get_annexeb( decoder_t *p_dec, uint8_t *p, int i_size )
409 p_nal = block_New( p_dec, 4 + i_size );
412 p_nal->p_buffer[0] = 0x00;
413 p_nal->p_buffer[1] = 0x00;
414 p_nal->p_buffer[2] = 0x00;
415 p_nal->p_buffer[3] = 0x01;
418 memcpy( &p_nal->p_buffer[4], p, i_size );
/*****************************************************************************
 * nal_get_decoded: copy a NAL payload into a newly malloc()ed buffer
 * The output buffer is allocated with the size of the input (i_src bytes) and
 * *pi_ret receives the distance between the write pointer and *pp_ret.
 * NOTE(review): the test on two leading 0x00 bytes suggests that emulation
 * prevention bytes are dropped while copying, but the rest of the condition
 * is not visible here - confirm. The malloc() result is not checked in the
 * lines visible here either.
 *****************************************************************************/
423 static void nal_get_decoded( uint8_t **pp_ret, int *pi_ret,
424 uint8_t *src, int i_src )
426 uint8_t *end = &src[i_src];
427 uint8_t *dst = malloc( i_src );
433 if( src < end - 3 && src[0] == 0x00 && src[1] == 0x00 &&
445 *pi_ret = dst - *pp_ret;
448 static inline int bs_read_ue( bs_t *s )
452 while( bs_read1( s ) == 0 && s->p < s->p_end && i < 32 )
456 return( ( 1 << i) - 1 + bs_read( s, i ) );
459 static inline int bs_read_se( bs_t *s )
461 int val = bs_read_ue( s );
463 return val&0x01 ? (val+1)/2 : -(val/2);
467 /*****************************************************************************
468 * ParseNALBlock: parses annexB type NALs
469 * All p_frag blocks are required to start with 0 0 0 1 4-byte startcode
 *
 * The NAL type found in p_frag decides what happens: slices update the
 * picture boundary detection, a SPS or PPS is parsed and kept in p_sys, and
 * other NALs are appended to the frame in progress (p_sys->p_frame). p_pic is
 * set by the OUTPUT helper when a picture is complete.
470 *****************************************************************************/
471 static block_t *ParseNALBlock( decoder_t *p_dec, block_t *p_frag )
473 decoder_sys_t *p_sys = p_dec->p_sys;
474 block_t *p_pic = NULL;
/* Byte 4 follows the 4-byte start code: bits 5-6 give nal_ref_idc and the low
 * 5 bits give the NAL type.
 * NOTE(review): no check that i_buffer is at least 5 is visible here. */
476 const int i_nal_ref_idc = (p_frag->p_buffer[4] >> 5)&0x03;
477 const int i_nal_type = p_frag->p_buffer[4]&0x1f;
/* The backslash-continued lines below form the body of the OUTPUT helper used
 * further down: it gathers the chained frame into p_pic, tags it with the
 * current frame type, resets the frame state and, for an I picture when both
 * a SPS and a PPS are stored, prepends duplicates of them to the picture. */
481 p_pic = block_ChainGather( p_sys->p_frame ); \
482 p_pic->i_length = 0; /* FIXME */ \
483 p_pic->i_flags |= p_sys->i_frame_type; \
485 p_sys->i_frame_type = 0; \
486 p_sys->p_frame = NULL; \
487 p_sys->b_slice = VLC_FALSE; \
489 if( ( p_pic->i_flags & BLOCK_FLAG_TYPE_I ) && \
490 p_sys->p_sps && p_sys->p_pps ) \
492 block_t *p_sps = block_Duplicate( p_sys->p_sps ); \
493 block_t *p_pps = block_Duplicate( p_sys->p_pps ); \
494 p_sps->i_dts = p_pps->i_dts = p_pic->i_dts; \
495 p_sps->i_pts = p_pps->i_pts = p_pic->i_pts; \
496 block_ChainAppend( &p_sps, p_pps ); \
497 block_ChainAppend( &p_sps, p_pic ); \
498 p_pic = block_ChainGather( p_sps ); \
/* Slices were accumulated but no SPS has been seen: drop them. */
503 if( p_sys->b_slice && !p_sys->b_sps )
505 block_ChainRelease( p_sys->p_frame );
506 msg_Warn( p_dec, "waiting for SPS" );
509 p_sys->p_frame = NULL;
510 p_sys->b_slice = VLC_FALSE;
514 i_nal_type >= NAL_SLICE && i_nal_type <= NAL_SLICE_IDR )
516 p_sys->b_slice = VLC_TRUE;
517 /* Fragment will be discarded later on */
519 else if( i_nal_type >= NAL_SLICE && i_nal_type <= NAL_SLICE_IDR )
522 int i_dec, i_first_mb, i_slice_type, i_frame_num;
523 vlc_bool_t b_pic = VLC_FALSE;
/* At most the first 60 payload bytes are converted before the slice header is
 * read.
 * NOTE(review): nal_get_decoded() allocates with malloc(); the matching
 * free() is not visible here - confirm. */
526 /* do not convert the whole frame */
527 nal_get_decoded( &dec, &i_dec, &p_frag->p_buffer[5],
528 __MIN( p_frag->i_buffer - 5, 60 ) );
529 bs_init( &s, dec, i_dec );
531 /* first_mb_in_slice */
532 i_first_mb = bs_read_ue( &s );
/* The slice type selects the frame type flag later applied by OUTPUT. */
535 switch( (i_slice_type = bs_read_ue( &s )) )
538 p_sys->i_frame_type = BLOCK_FLAG_TYPE_P;
541 p_sys->i_frame_type = BLOCK_FLAG_TYPE_B;
544 p_sys->i_frame_type = BLOCK_FLAG_TYPE_I;
546 case 3: case 8: /* SP */
547 p_sys->i_frame_type = BLOCK_FLAG_TYPE_P;
550 p_sys->i_frame_type = BLOCK_FLAG_TYPE_I;
554 /* pic_parameter_set_id */
/* frame_num is read on i_log2_max_frame_num + 4 bits, the former being the
 * value stored while parsing the SPS. */
557 i_frame_num = bs_read( &s, p_sys->i_log2_max_frame_num + 4 );
559 /* Detection of the first VCL NAL unit of a primary coded picture
561 if( i_frame_num != p_sys->i_frame_num ||
562 ( (i_nal_ref_idc != p_sys->i_nal_ref_idc) &&
563 (!i_nal_ref_idc || !p_sys->i_nal_ref_idc) ) )
567 p_sys->i_frame_num = i_frame_num;
568 p_sys->i_nal_ref_idc = i_nal_ref_idc;
570 if( !p_sys->b_frame_mbs_only )
573 if( bs_read( &s, 1 ) )
575 /* bottom_field_flag */
/* For IDR slices, a change of NAL type or of idr_pic_id also marks the start
 * of a new picture. */
580 if( i_nal_type == NAL_SLICE_IDR )
583 int i_idr_pic_id = bs_read_ue( &s );
584 if( p_sys->i_nal_type != i_nal_type ) b_pic = VLC_TRUE;
585 if( p_sys->i_idr_pic_id != i_idr_pic_id ) b_pic = VLC_TRUE;
586 p_sys->i_idr_pic_id = i_idr_pic_id;
588 p_sys->i_nal_type = i_nal_type;
/* A new picture starts here: emit the slices accumulated so far. */
590 if( b_pic && p_sys->b_slice ) OUTPUT;
592 p_sys->b_slice = VLC_TRUE;
596 else if( i_nal_type == NAL_SPS )
603 if( !p_sys->b_sps ) msg_Dbg( p_dec, "found NAL_SPS" );
605 p_sys->b_sps = VLC_TRUE;
/* Unlike the slice case, the whole SPS payload is converted. */
607 nal_get_decoded( &dec, &i_dec, &p_frag->p_buffer[5],
608 p_frag->i_buffer - 5 );
610 bs_init( &s, dec, i_dec );
611 /* Skip profile(8), constraint_set012, reserved(5), level(8) */
612 bs_skip( &s, 8 + 1+1+1 + 5 + 8 );
615 /* Read i_log2_max_frame_num: kept for the slice header parsing */
616 p_sys->i_log2_max_frame_num = bs_read_ue( &s );
618 i_tmp = bs_read_ue( &s );
621 /* skip i_log2_max_poc_lsb */
624 else if( i_tmp == 1 )
627 /* skip b_delta_pic_order_always_zero */
629 /* skip i_offset_for_non_ref_pic */
631 /* skip i_offset_for_top_to_bottom_field */
633 /* read i_num_ref_frames_in_poc_cycle */
634 i_cycle = bs_read_ue( &s );
/* Clamp the count read from the stream to 256. */
635 if( i_cycle > 256 ) i_cycle = 256;
638 /* skip i_offset_for_ref_frame */
642 /* i_num_ref_frames */
644 /* b_gaps_in_frame_num_value_allowed */
/* Width and height are each 16 * (coded value + 1).
 * NOTE(review): no cropping or frame_mbs_only adjustment of these values is
 * visible here - confirm. */
648 p_dec->fmt_out.video.i_width = 16 * ( bs_read_ue( &s ) + 1 );
649 p_dec->fmt_out.video.i_height = 16 * ( bs_read_ue( &s ) + 1 );
651 /* b_frame_mbs_only */
652 p_sys->b_frame_mbs_only = bs_read( &s, 1 );
653 if( p_sys->b_frame_mbs_only == 0 )
657 /* b_direct8x8_inference */
661 i_tmp = bs_read( &s, 1 );
675 i_tmp = bs_read( &s, 1 );
678 /* read the aspect ratio part if any FIXME check it */
679 i_tmp = bs_read( &s, 1 );
/* Table of 14 predefined sample aspect ratios (w, h). */
682 static const struct { int w, h; } sar[14] =
684 { 0, 0 }, { 1, 1 }, { 12, 11 }, { 10, 11 },
685 { 16, 11 }, { 40, 33 }, { 24, 11 }, { 20, 11 },
686 { 32, 11 }, { 80, 33 }, { 18, 11 }, { 15, 11 },
687 { 64, 33 }, { 160,99 },
/* NOTE(review): presumably i_sar indexes sar[] when it is below 14 and an
 * explicit 16-bit w/h pair is read otherwise - the selecting lines are not
 * visible here, confirm. */
689 int i_sar = bs_read( &s, 8 );
699 w = bs_read( &s, 16 );
700 h = bs_read( &s, 16 );
/* NOTE(review): this divides by h and by i_height with integer arithmetic;
 * confirm that h == 0 is excluded by a guard not visible here. */
703 p_dec->fmt_out.video.i_aspect = VOUT_ASPECT_FACTOR * w /
704 h * p_dec->fmt_out.video.i_width /
705 p_dec->fmt_out.video.i_height;
707 p_dec->fmt_out.video.i_aspect = VOUT_ASPECT_FACTOR;
/* A SPS ends the picture in progress, if any. */
713 if( p_sys->b_slice ) OUTPUT;
715 /* We have a new SPS */
716 if( p_sys->p_sps ) block_Release( p_sys->p_sps );
717 p_sys->p_sps = p_frag;
719 /* Do not append the SPS because we will insert it on keyframes */
722 else if( i_nal_type == NAL_PPS )
/* NOTE(review): the PPS is read straight from the raw buffer, without the
 * nal_get_decoded() pass used for the SPS and the slices - confirm that this
 * is intended. */
725 bs_init( &s, &p_frag->p_buffer[5], p_frag->i_buffer - 5 );
727 if( !p_sys->b_pps ) msg_Dbg( p_dec, "found NAL_PPS" );
728 p_sys->b_pps = VLC_TRUE;
/* A PPS ends the picture in progress, if any. */
732 if( p_sys->b_slice ) OUTPUT;
734 /* We have a new PPS */
735 if( p_sys->p_pps ) block_Release( p_sys->p_pps );
736 p_sys->p_pps = p_frag;
738 /* Do not append the PPS because we will insert it on keyframes */
/* These NAL types also end the picture in progress. */
741 else if( i_nal_type == NAL_AU_DELIMITER ||
742 i_nal_type == NAL_SEI ||
743 ( i_nal_type >= 13 && i_nal_type <= 18 ) )
745 if( p_sys->b_slice ) OUTPUT;
750 /* Append the block */
751 block_ChainAppend( &p_sys->p_frame, p_frag );