1 /*****************************************************************************
2 * asx.c : ASX playlist format import
3 *****************************************************************************
4 * Copyright (C) 2005-2006 the VideoLAN team
7 * Authors: Derk-Jan Hartman <hartman at videolan dot org>
9 * This program is free software; you can redistribute it and/or modify
10 * it under the terms of the GNU General Public License as published by
11 * the Free Software Foundation; either version 2 of the License, or
12 * (at your option) any later version.
14 * This program is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 * GNU General Public License for more details.
19 * You should have received a copy of the GNU General Public License
20 * along with this program; if not, write to the Free Software
21 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston MA 02110-1301, USA.
22 *****************************************************************************/
24 /* See also: http://msdn.microsoft.com/library/en-us/wmplay10/mmp_sdk/windowsmediametafilereference.asp
27 /*****************************************************************************
29 *****************************************************************************/
34 #include <vlc_common.h>
35 #include <vlc_demux.h>
38 #include <vlc_charset.h>
51 /*****************************************************************************
53 *****************************************************************************/
/* Forward declarations of Demux() and Control(); both are defined further
 * down in this file. */
54 static int Demux( demux_t *p_demux);
55 static int Control( demux_t *p_demux, int i_query, va_list args );
/*
 * StoreString: copy the bytes between psz_source_start and psz_source_end
 * into a newly allocated string and publish it through *ppsz_string.
 *
 * p_demux          demuxer whose p_sys->b_utf8 flag drives the buffer sizing
 * ppsz_string      receives the newly allocated string
 * psz_source_start first byte of the text to copy
 * psz_source_end   one past the last byte of the text to copy
 *
 * Two code paths are visible: a plain copy that is NUL-terminated and passed
 * to EnsureUTF8(), and a Latin-1 -> UTF-8 expansion loop followed by a
 * realloc() that trims the buffer to the number of bytes actually written.
 * NOTE(review): the conditions selecting between the two paths, the handling
 * of a failed malloc() and the return statements are not visible here --
 * confirm against the complete function.
 */
57 static int StoreString( demux_t *p_demux, char **ppsz_string,
58 const char *psz_source_start,
59 const char *psz_source_end )
61 demux_sys_t *p_sys = p_demux->p_sys;
62 unsigned len = psz_source_end - psz_source_start;
/* Reserve len bytes when the playlist is flagged UTF-8 and 2 * len bytes
 * otherwise (the expansion below can emit two output bytes per input byte),
 * plus one byte for the terminator. */
66 char *buf = *ppsz_string = malloc ((len * (1 + !p_sys->b_utf8)) + 1);
72 memcpy (buf, psz_source_start, len);
73 (*ppsz_string)[len] = '\0';
74 EnsureUTF8 (*ppsz_string);
78 /* Latin-1 -> UTF-8 */
79 for (unsigned i = 0; i < len; i++)
81 unsigned char c = psz_source_start[i];
/* Two-byte UTF-8 sequence: lead byte carries the top two bits of c, the
 * continuation byte carries the low six bits. */
84 *buf++ = 0xc0 | (c >> 6);
85 *buf++ = 0x80 | (c & 0x3f);
/* Trim the buffer to the bytes actually written. The result of realloc() is
 * only committed when it succeeded: on failure the original (larger) buffer
 * is still valid, so the string is kept instead of being leaked and replaced
 * by NULL. */
92 {
    char *psz_trimmed = realloc (*ppsz_string, buf - *ppsz_string);
    if (psz_trimmed != NULL)
        buf = *ppsz_string = psz_trimmed;
}
/*
 * SkipBlanks: takes a string position and a byte budget and returns a
 * position inside that string.
 *
 * s         position to start from
 * i_strlen  maximum number of bytes the loop may consume
 *
 * NOTE(review): only the signature and the loop header are visible here.
 * Judging by the name and by the callers, it presumably steps over leading
 * whitespace and returns the first non-blank position -- confirm against the
 * complete body. Several callers in Demux() pass (unsigned)-1 as the budget,
 * i.e. an effectively unlimited count, so for those calls the loop has to
 * stop on the data itself rather than on the budget.
 */
97 static char *SkipBlanks(char *s, size_t i_strlen )
/* Keep going only while some of the byte budget is left. */
99 while( i_strlen > 0 ) {
/*
 * ParseTime: convert a textual time attribute into an integer.
 *
 * s         start of the text (not necessarily NUL-terminated at the end of
 *           the value; the length is given separately)
 * i_strlen  number of bytes that belong to the value
 *
 * The text is expected to look like hour:minutes:sec.fraction. Three runs of
 * decimal digits are accumulated, and the running result is multiplied by 60
 * before the second and before the third run. The fractional part is not
 * parsed (see the TODO at the end).
 * NOTE(review): the declarations of val/result, the separator handling
 * between the runs and the return statement are not visible here; the result
 * is presumably a number of seconds -- confirm.
 * NOTE(review): val*10 is computed in int, so a very long digit run can
 * exceed the range of int -- check how the lines following each computation
 * of newval deal with that.
 */
116 static int ParseTime(char *s, size_t i_strlen)
118 // need to parse hour:minutes:sec.fraction string
/* All scanning below is bounded by this end pointer. */
121 const char *end = s + i_strlen;
122 // skip leading spaces if any
123 s = SkipBlanks(s, i_strlen);
/* isdigit() is only defined for values representable as unsigned char (or
 * EOF). Plain char may be negative for bytes >= 0x80, so the byte is cast
 * before classification. */
126 while( (s < end) && isdigit((unsigned char)*s) )
128 int newval = val*10 + (*s - '0');
139 s = SkipBlanks(s, end-s);
143 s = SkipBlanks(s, end-s);
/* Scale what has been accumulated so far before reading the next field. */
144 result = result * 60;
146 while( (s < end) && isdigit((unsigned char)*s) )
148 int newval = val*10 + (*s - '0');
159 s = SkipBlanks(s, end-s);
163 s = SkipBlanks(s, end-s);
164 result = result * 60;
166 while( (s < end) && isdigit((unsigned char)*s) )
168 int newval = val*10 + (*s - '0');
179 // TODO: one day, we may need to parse fraction for sub-second resolution
185 /*****************************************************************************
186 * Import_ASX: main import function
187 *****************************************************************************/
/*
 * Import_ASX: probe the input and set up the ASX parser state.
 *
 * The input is accepted when any one of these holds: the POKE() check
 * against "<asx" on the peeked data succeeds, the path has the extension
 * .asx, .wax or .wvx, or the "asx-open" demuxer was forced. The parser state
 * in p_demux->p_sys is then initialised for Demux().
 *
 * NOTE(review): what happens when none of the conditions holds, and the
 * values returned, are not visible here -- confirm against the complete
 * function.
 */
188 int Import_ASX( vlc_object_t *p_this )
190 demux_t *p_demux = (demux_t *)p_this;
191 const uint8_t *p_peek;
/* CHECK_PEEK is a project macro; presumably it peeks 10 bytes into p_peek
 * and leaves the function when that is not possible -- TODO confirm. */
192 CHECK_PEEK( p_peek, 10 );
194 // skip over possible leading empty lines and empty spaces
/* The skip budget is 6 bytes, which out of a 10-byte peek leaves at least
 * the 4 bytes that are compared with "<asx" below. The casts are needed
 * because SkipBlanks() works on non-const char pointers. */
195 p_peek = (uint8_t *)SkipBlanks((char *)p_peek, 6);
/* POKE is a project macro; presumably a case-insensitive prefix comparison
 * -- TODO confirm. */
197 if( POKE( p_peek, "<asx", 4 ) || demux_IsPathExtension( p_demux, ".asx" ) ||
198 demux_IsPathExtension( p_demux, ".wax" ) || demux_IsPathExtension( p_demux, ".wvx" ) ||
199 demux_IsForced( p_demux, "asx-open" ) )
206 STANDARD_DEMUX_INIT_MSG( "found valid ASX playlist" );
207 p_demux->p_sys->psz_prefix = FindPrefix( p_demux );
/* No playlist text is loaded yet: Demux() reads the file when it finds a
 * negative i_data_len. */
208 p_demux->p_sys->psz_data = NULL;
209 p_demux->p_sys->i_data_len = -1;
/* Text is treated as non-UTF-8 until Demux() sees a PARAM element named
 * "encoding" whose value is "utf-8". */
210 p_demux->p_sys->b_utf8 = false;
/* Demux() consults this flag, together with the per-entry skip marker, to
 * drop entries. */
211 p_demux->p_sys->b_skip_ads = config_GetInt( p_demux, "playlist-skip-ads" );
216 /*****************************************************************************
217 * Close_ASX: frees the prefix string and the loaded playlist text
218 *****************************************************************************/
/*
 * Close_ASX: release the heap buffers referenced by the parser state.
 *
 * Frees the prefix string that Import_ASX() obtained from FindPrefix() and
 * the playlist text buffer that Demux() allocates.
 * NOTE(review): whether the p_sys structure itself is released is not
 * visible here -- confirm against the complete function.
 */
219 void Close_ASX( vlc_object_t *p_this )
221 demux_t *p_demux = (demux_t *)p_this;
222 demux_sys_t *p_sys = p_demux->p_sys;
224 free( p_sys->psz_prefix );
225 free( p_sys->psz_data );
229 static int Demux( demux_t *p_demux )
231 demux_sys_t *p_sys = p_demux->p_sys;
232 char *psz_parse = NULL;
233 char *psz_backup = NULL;
234 bool b_entry = false;
238 if( p_sys->i_data_len < 0 )
241 p_sys->i_data_len = stream_Size( p_demux->s ) +1; /* This is a cheat to prevent unnecessary realloc */
242 if( p_sys->i_data_len <= 0 && p_sys->i_data_len < 16384 ) p_sys->i_data_len = 1024;
243 p_sys->psz_data = malloc( p_sys->i_data_len +1);
245 /* load the complete file */
248 int i_read = stream_Read( p_demux->s, &p_sys->psz_data[i_pos], p_sys->i_data_len - i_pos );
249 p_sys->psz_data[i_pos + i_read] = '\0';
251 if( i_read < p_sys->i_data_len - i_pos ) break; /* Done */
254 p_sys->i_data_len += 1024;
255 p_sys->psz_data = realloc( p_sys->psz_data, p_sys->i_data_len * sizeof( char * ) +1 );
257 if( p_sys->i_data_len <= 0 ) return -1;
260 psz_parse = p_sys->psz_data;
261 /* Find first element */
262 if( ( psz_parse = strcasestr( psz_parse, "<ASX" ) ) )
265 char *psz_string = NULL;
268 char *psz_base_asx = NULL;
269 char *psz_title_asx = NULL;
270 char *psz_artist_asx = NULL;
271 char *psz_copyright_asx = NULL;
272 char *psz_moreinfo_asx = NULL;
273 char *psz_abstract_asx = NULL;
275 char *psz_base_entry = NULL;
276 char *psz_title_entry = NULL;
277 char *psz_artist_entry = NULL;
278 char *psz_copyright_entry = NULL;
279 char *psz_moreinfo_entry = NULL;
280 char *psz_abstract_entry = NULL;
281 int i_entry_count = 0;
282 bool b_skip_entry = false;
284 char *psz_href = NULL;
288 psz_parse = strcasestr( psz_parse, ">" );
290 while( psz_parse && ( psz_parse = strcasestr( psz_parse, "<" ) ) )
292 if( !strncasecmp( psz_parse, "<!--", 4 ) )
294 /* this is a comment */
295 if( ( psz_parse = strcasestr( psz_parse, "-->" ) ) )
299 else if( !strncasecmp( psz_parse, "<PARAM ", 7 ) )
301 bool b_encoding_flag = false;
302 psz_parse = SkipBlanks(psz_parse+7, (unsigned)-1);
303 if( !strncasecmp( psz_parse, "name", 4 ) )
305 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
307 psz_backup = ++psz_parse;
308 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
310 i_strlen = psz_parse-psz_backup;
311 if( i_strlen < 1 ) continue;
312 msg_Dbg( p_demux, "param name strlen: %d", i_strlen);
313 psz_string = malloc( i_strlen + 1);
314 memcpy( psz_string, psz_backup, i_strlen );
315 psz_string[i_strlen] = '\0';
316 msg_Dbg( p_demux, "param name: %s", psz_string);
317 b_encoding_flag = !strcasecmp( psz_string, "encoding" );
325 if( !strncasecmp( psz_parse, "value", 5 ) )
327 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
329 psz_backup = ++psz_parse;
330 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
332 i_strlen = psz_parse-psz_backup;
333 if( i_strlen < 1 ) continue;
334 msg_Dbg( p_demux, "param value strlen: %d", i_strlen);
335 psz_string = malloc( i_strlen +1);
336 memcpy( psz_string, psz_backup, i_strlen );
337 psz_string[i_strlen] = '\0';
338 msg_Dbg( p_demux, "param value: %s", psz_string);
339 if( b_encoding_flag && !strcasecmp( psz_string, "utf-8" ) ) p_sys->b_utf8 = true;
346 if( ( psz_parse = strcasestr( psz_parse, "/>" ) ) )
350 else if( !strncasecmp( psz_parse, "<BANNER", 7 ) )
352 /* We skip this element */
353 if( ( psz_parse = strcasestr( psz_parse, "</BANNER>" ) ) )
357 else if( !strncasecmp( psz_parse, "<PREVIEWDURATION", 16 ) ||
358 !strncasecmp( psz_parse, "<LOGURL", 7 ) ||
359 !strncasecmp( psz_parse, "<Skin", 5 ) )
361 /* We skip this element */
362 if( ( psz_parse = strcasestr( psz_parse, "/>" ) ) )
366 else if( !strncasecmp( psz_parse, "<BASE ", 6 ) )
368 psz_parse = SkipBlanks(psz_parse+6, (unsigned)-1);
369 if( !strncasecmp( psz_parse, "HREF", 4 ) )
371 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
373 psz_backup = ++psz_parse;
374 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
376 StoreString( p_demux, (b_entry ? &psz_base_entry : &psz_base_asx), psz_backup, psz_parse );
382 if( ( psz_parse = strcasestr( psz_parse, "/>" ) ) )
386 else if( !strncasecmp( psz_parse, "<TITLE>", 7 ) )
388 psz_backup = psz_parse+=7;
389 if( ( psz_parse = strcasestr( psz_parse, "</TITLE>" ) ) )
391 StoreString( p_demux, (b_entry ? &psz_title_entry : &psz_title_asx), psz_backup, psz_parse );
396 else if( !strncasecmp( psz_parse, "<Author>", 8 ) )
398 psz_backup = psz_parse+=8;
399 if( ( psz_parse = strcasestr( psz_parse, "</Author>" ) ) )
401 StoreString( p_demux, (b_entry ? &psz_artist_entry : &psz_artist_asx), psz_backup, psz_parse );
406 else if( !strncasecmp( psz_parse, "<Copyright", 10 ) )
408 psz_backup = psz_parse+=11;
409 if( ( psz_parse = strcasestr( psz_parse, "</Copyright>" ) ) )
411 StoreString( p_demux, (b_entry ? &psz_copyright_entry : &psz_copyright_asx), psz_backup, psz_parse );
416 else if( !strncasecmp( psz_parse, "<MoreInfo ", 10 ) )
418 psz_parse = SkipBlanks(psz_parse+10, (unsigned)-1);
419 if( !strncasecmp( psz_parse, "HREF", 4 ) )
421 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
423 psz_backup = ++psz_parse;
424 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
426 StoreString( p_demux, (b_entry ? &psz_moreinfo_entry : &psz_moreinfo_asx), psz_backup, psz_parse );
432 if( ( psz_parse = strcasestr( psz_parse, "/>" ) ) )
436 else if( !strncasecmp( psz_parse, "<ABSTRACT>", 10 ) )
438 psz_backup = psz_parse+=10;
439 if( ( psz_parse = strcasestr( psz_parse, "</ABSTRACT>" ) ) )
441 StoreString( p_demux, (b_entry ? &psz_abstract_entry : &psz_abstract_asx), psz_backup, psz_parse );
446 else if( !strncasecmp( psz_parse, "<EntryRef ", 10 ) )
448 psz_parse = SkipBlanks(psz_parse+10, (unsigned)-1);
449 if( !strncasecmp( psz_parse, "HREF", 4 ) )
451 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
453 psz_backup = ++psz_parse;
454 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
456 i_strlen = psz_parse-psz_backup;
457 if( i_strlen < 1 ) continue;
458 psz_string = malloc( i_strlen +1);
459 memcpy( psz_string, psz_backup, i_strlen );
460 psz_string[i_strlen] = '\0';
461 input_item_t *p_input;
462 p_input = input_item_New( p_demux, psz_string, psz_title_asx );
463 input_item_CopyOptions( p_current_input, p_input );
464 input_item_AddSubItem( p_current_input, p_input );
465 vlc_gc_decref( p_input );
472 if( ( psz_parse = strcasestr( psz_parse, "/>" ) ) )
476 else if( !strncasecmp( psz_parse, "</Entry>", 8 ) )
478 input_item_t *p_entry = NULL;
479 char *psz_name = NULL;
481 char * ppsz_options[2];
484 /* add a new entry */
488 msg_Err( p_demux, "end of entry without start?" );
494 msg_Err( p_demux, "entry without href?" );
498 if( p_sys->b_skip_ads && b_skip_entry )
500 char *psz_current_input_name = input_item_GetName( p_current_input );
502 msg_Dbg( p_demux, "skipped entry %d %s (%s)",
504 ( psz_title_entry ? psz_title_entry : psz_current_input_name ), psz_href );
505 free( psz_current_input_name );
509 if( i_starttime || i_duration )
513 if( asprintf(ppsz_options+i_options, ":start-time=%d", i_starttime) == -1 )
514 *(ppsz_options+i_options) = NULL;
520 if( asprintf(ppsz_options+i_options, ":stop-time=%d", i_starttime + i_duration) == -1 )
521 *(ppsz_options+i_options) = NULL;
527 /* create the new entry */
528 char *psz_current_input_name = input_item_GetName( p_current_input );
529 if( asprintf( &psz_name, "%d %s", i_entry_count, ( psz_title_entry ? psz_title_entry : psz_current_input_name ) ) != -1 )
531 p_entry = input_item_NewExt( p_demux, psz_href, psz_name, i_options, (const char * const *)ppsz_options, -1 );
533 input_item_CopyOptions( p_current_input, p_entry );
536 psz_name = ppsz_options[--i_options];
541 if( psz_title_entry ) input_item_SetTitle( p_entry, psz_title_entry );
542 if( psz_artist_entry ) input_item_SetArtist( p_entry, psz_artist_entry );
543 if( psz_copyright_entry ) input_item_SetCopyright( p_entry, psz_copyright_entry );
544 if( psz_moreinfo_entry ) input_item_SetURL( p_entry, psz_moreinfo_entry );
545 if( psz_abstract_entry ) input_item_SetDescription( p_entry, psz_abstract_entry );
546 input_item_AddSubItem( p_current_input, p_entry );
547 vlc_gc_decref( p_entry );
549 free( psz_current_input_name );
553 FREENULL( psz_href );
554 FREENULL( psz_title_entry );
555 FREENULL( psz_base_entry );
556 FREENULL( psz_artist_entry );
557 FREENULL( psz_copyright_entry );
558 FREENULL( psz_moreinfo_entry );
559 FREENULL( psz_abstract_entry );
562 else if( !strncasecmp( psz_parse, "<Entry", 6 ) )
564 char *psz_clientskip;
568 msg_Err( p_demux, "We already are in an entry section" );
573 psz_clientskip = strcasestr( psz_parse, "clientskip=\"no\"" );
574 psz_parse = strcasestr( psz_parse, ">" );
576 /* If clientskip was enabled ... this is an ad */
577 b_skip_entry = (NULL != psz_clientskip) && (psz_clientskip < psz_parse);
579 // init entry details
584 else if( !strncasecmp( psz_parse, "<Ref ", 5 ) )
586 psz_parse = SkipBlanks(psz_parse+5, (unsigned)-1);
589 msg_Err( p_demux, "A ref outside an entry section" );
593 if( !strncasecmp( psz_parse, "HREF", 4 ) )
595 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
597 psz_backup = ++psz_parse;
598 psz_backup = SkipBlanks(psz_backup, (unsigned)-1);
599 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
602 i_strlen = psz_parse-psz_backup;
603 if( i_strlen < 1 ) continue;
606 psz_href = malloc( i_strlen +1);
607 memcpy( psz_href, psz_backup, i_strlen );
608 psz_href[i_strlen] = '\0';
609 psz_tmp = psz_href + (i_strlen-1);
610 while( psz_tmp >= psz_href &&
611 ( *psz_tmp == '\r' || *psz_tmp == '\n' ) )
621 if( ( psz_parse = strcasestr( psz_parse, ">" ) ) )
625 else if( !strncasecmp( psz_parse, "<starttime ", 11 ) )
627 psz_parse = SkipBlanks(psz_parse+11, (unsigned)-1);
630 msg_Err( p_demux, "starttime outside an entry section" );
634 if( !strncasecmp( psz_parse, "value", 5 ) )
636 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
638 psz_backup = ++psz_parse;
639 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
641 i_strlen = psz_parse-psz_backup;
642 if( i_strlen < 1 ) continue;
644 i_starttime = ParseTime(psz_backup, i_strlen);
650 if( ( psz_parse = strcasestr( psz_parse, ">" ) ) )
654 else if( !strncasecmp( psz_parse, "<duration ", 11 ) )
656 psz_parse = SkipBlanks(psz_parse+5, (unsigned)-1);
659 msg_Err( p_demux, "duration outside an entry section" );
663 if( !strncasecmp( psz_parse, "value", 5 ) )
665 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
667 psz_backup = ++psz_parse;
668 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
670 i_strlen = psz_parse-psz_backup;
671 if( i_strlen < 1 ) continue;
673 i_duration = ParseTime(psz_backup, i_strlen);
679 if( ( psz_parse = strcasestr( psz_parse, ">" ) ) )
683 else if( !strncasecmp( psz_parse, "</ASX", 5 ) )
685 if( psz_title_asx ) input_item_SetTitle( p_current_input, psz_title_asx );
686 if( psz_artist_asx ) input_item_SetArtist( p_current_input, psz_artist_asx );
687 if( psz_copyright_asx ) input_item_SetCopyright( p_current_input, psz_copyright_asx );
688 if( psz_moreinfo_asx ) input_item_SetURL( p_current_input, psz_moreinfo_asx );
689 if( psz_abstract_asx ) input_item_SetDescription( p_current_input, psz_abstract_asx );
690 FREENULL( psz_base_asx );
691 FREENULL( psz_title_asx );
692 FREENULL( psz_artist_asx );
693 FREENULL( psz_copyright_asx );
694 FREENULL( psz_moreinfo_asx );
695 FREENULL( psz_abstract_asx );
701 /* FIXME Unsupported elements */
709 HANDLE_PLAY_AND_RELEASE;
710 return 0; /* Needed for correct operation of go back */
/*
 * Control: control entry point of this demuxer.
 *
 * None of the three parameters is used; they are only marked as unused to
 * keep the compiler quiet.
 * NOTE(review): the value returned is not visible here -- confirm against
 * the complete function.
 */
713 static int Control( demux_t *p_demux, int i_query, va_list args )
715 VLC_UNUSED(p_demux); VLC_UNUSED(i_query); VLC_UNUSED(args);