1 /*****************************************************************************
2 * asx.c : ASX playlist format import
3 *****************************************************************************
4 * Copyright (C) 2005-2006 the VideoLAN team
7 * Authors: Derk-Jan Hartman <hartman at videolan dot org>
9 * This program is free software; you can redistribute it and/or modify
10 * it under the terms of the GNU General Public License as published by
11 * the Free Software Foundation; either version 2 of the License, or
12 * (at your option) any later version.
14 * This program is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 * GNU General Public License for more details.
19 * You should have received a copy of the GNU General Public License
20 * along with this program; if not, write to the Free Software
21 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston MA 02110-1301, USA.
22 *****************************************************************************/
24 /* See also: http://msdn.microsoft.com/library/en-us/wmplay10/mmp_sdk/windowsmediametafilereference.asp
27 /*****************************************************************************
29 *****************************************************************************/
34 #include <vlc_common.h>
35 #include <vlc_demux.h>
38 #include <vlc_charset.h>
51 /*****************************************************************************
53 *****************************************************************************/
/* Forward declarations: both functions are defined further down in this file. */
54 static int Demux( demux_t *p_demux);
55 static int Control( demux_t *p_demux, int i_query, va_list args );
/*
 * StoreString: copies the bytes in [psz_source_start, psz_source_end) into a
 * freshly malloc'd buffer and stores that buffer in *ppsz_string.
 *
 *   p_demux           demuxer whose p_sys->b_utf8 flag sizes the buffer
 *   ppsz_string       receives the newly allocated string
 *   psz_source_start  first byte to copy
 *   psz_source_end    one past the last byte to copy
 *
 * NOTE(review): this listing omits several lines of the function (at least
 * the braces; presumably also the branch on b_utf8 and the return
 * statements), so the exact control flow and the returned values cannot be
 * confirmed from here.
 */
57 static int StoreString( demux_t *p_demux, char **ppsz_string,
58 const char *psz_source_start,
59 const char *psz_source_end )
61 demux_sys_t *p_sys = p_demux->p_sys;
/* NOTE(review): the pointer difference is stored in an unsigned; an end
 * pointer that precedes the start pointer would wrap to a huge length. */
62 unsigned len = psz_source_end - psz_source_start;
/* One output byte per input byte when b_utf8 is set, two otherwise (a
 * Latin-1 byte can expand to the two-byte sequence written below), plus one
 * byte for the terminating NUL. */
66 char *buf = *ppsz_string = malloc ((len * (1 + !p_sys->b_utf8)) + 1);
/* Plain copy, NUL-terminate, then EnsureUTF8() -- presumably the b_utf8
 * branch; the condition itself is not visible in this listing. */
72 memcpy (buf, psz_source_start, len);
73 (*ppsz_string)[len] = '\0';
74 EnsureUTF8 (*ppsz_string);
78 /* Latin-1 -> UTF-8 */
79 for (unsigned i = 0; i < len; i++)
81 unsigned char c = psz_source_start[i];
/* Two-byte encoding of c: the lead byte carries the top two bits of c, the
 * continuation byte carries the low six bits. */
84 *buf++ = 0xc0 | (c >> 6);
85 *buf++ = 0x80 | (c & 0x3f);
/* Shrink the allocation to the number of bytes actually written.
 * NOTE(review): the realloc result overwrites *ppsz_string directly, so the
 * original buffer would be leaked if realloc ever returned NULL. */
92 buf = *ppsz_string = realloc (*ppsz_string, buf - *ppsz_string);
/*
 * SkipBlanks: takes a string pointer and a character budget and returns a
 * char pointer. Callers in this file use the result as the position after
 * leading blanks, and pass (unsigned)-1 as the budget when they have no
 * explicit bound.
 *
 * NOTE(review): only the signature and the loop header are visible in this
 * listing; which characters count as blank, and the return statement, are
 * not shown here.
 */
97 static char *SkipBlanks(char *s, size_t i_strlen )
/* Loops while some of the i_strlen budget remains. */
99 while( i_strlen > 0 ) {
/*
 * ParseTime: parses a time string of the form hour:minutes:sec.fraction from
 * the i_strlen bytes starting at s and returns an int.
 *
 * Three successive decimal fields are accumulated digit by digit; the running
 * result is multiplied by 60 before the second and before the third field
 * (presumably yielding whole seconds -- the lines that fold each field into
 * result are not visible). The fractional part is not parsed.
 *
 * NOTE(review): this listing omits the declarations of result and val, the
 * separator checks between fields, the overflow handling and the return
 * statement.
 */
116 static int ParseTime(char *s, size_t i_strlen)
118 // need to parse hour:minutes:sec.fraction string
/* end bounds every digit loop below so parsing never reads past the value. */
121 const char *end = s + i_strlen;
122 // skip leading spaces if any
123 s = SkipBlanks(s, i_strlen);
/* First field.
 * NOTE(review): isdigit() receives a plain char; for negative char values
 * the behaviour is undefined -- the argument should be cast to unsigned
 * char. The same applies to the two loops further down. */
126 while( (s < end) && isdigit(*s) )
/* NOTE(review): if val is a signed int, an overflow in val*10 is undefined
 * behaviour and cannot be reliably detected after the fact. */
128 int newval = val*10 + (*s - '0');
139 s = SkipBlanks(s, end-s);
143 s = SkipBlanks(s, end-s);
/* Scale what has been accumulated so far before reading the second field. */
144 result = result * 60;
146 while( (s < end) && isdigit(*s) )
148 int newval = val*10 + (*s - '0');
159 s = SkipBlanks(s, end-s);
163 s = SkipBlanks(s, end-s);
/* Scale again before reading the third field. */
164 result = result * 60;
166 while( (s < end) && isdigit(*s) )
168 int newval = val*10 + (*s - '0');
179 // TODO: one day, we may need to parse fraction for sub-second resolution
185 /*****************************************************************************
186 * Import_ASX: main import function
187 *****************************************************************************/
/*
 * Import_ASX: probes the stream and, when it is accepted as an ASX playlist,
 * initialises the demuxer's private state (p_demux->p_sys).
 *
 *   p_this  object that is cast to demux_t
 *
 * NOTE(review): this listing omits the braces, the rejecting branch and the
 * return statements, so the returned values are not visible here.
 */
188 int Import_ASX( vlc_object_t *p_this )
190 demux_t *p_demux = (demux_t *)p_this;
191 const uint8_t *p_peek;
/* CHECK_PEEK is defined outside this listing; presumably it peeks 10 bytes
 * into p_peek and bails out if they are not available -- confirm. */
192 CHECK_PEEK( p_peek, 10 );
194 // skip over possible leading empty lines and empty spaces
/* At most 6 characters are skipped, which leaves 4 of the 10 requested bytes
 * for the 4-character "<asx" check below. */
195 p_peek = (uint8_t *)SkipBlanks((char *)p_peek, 6);
/* Accept on the "<asx" signature (POKE is defined elsewhere; presumably a
 * prefix comparison), on a .asx / .wax / .wvx path extension, or when the
 * "asx-open" demuxer is forced. */
197 if( POKE( p_peek, "<asx", 4 ) || demux_IsPathExtension( p_demux, ".asx" ) ||
198 demux_IsPathExtension( p_demux, ".wax" ) || demux_IsPathExtension( p_demux, ".wvx" ) ||
199 demux_IsForced( p_demux, "asx-open" ) )
206 STANDARD_DEMUX_INIT_MSG( "found valid ASX playlist" );
/* Initial private state. i_data_len = -1 is what Demux tests
 * (i_data_len < 0) to decide that the file still has to be loaded; b_utf8
 * starts false and is switched on by an encoding PARAM in Demux. */
207 p_demux->p_sys->psz_prefix = FindPrefix( p_demux );
208 p_demux->p_sys->psz_data = NULL;
209 p_demux->p_sys->i_data_len = -1;
210 p_demux->p_sys->b_utf8 = false;
211 p_demux->p_sys->b_skip_ads = config_GetInt( p_demux, "playlist-skip-ads" );
216 /*****************************************************************************
217 * Close_ASX: frees unused data
218 *****************************************************************************/
/*
 * Close_ASX: releases the prefix string and the playlist data buffer held in
 * the demuxer's private state.
 *
 *   p_this  object that is cast to demux_t
 *
 * NOTE(review): whether p_sys itself is released is not visible in this
 * listing.
 */
219 void Close_ASX( vlc_object_t *p_this )
221 demux_t *p_demux = (demux_t *)p_this;
222 demux_sys_t *p_sys = p_demux->p_sys;
/* free(NULL) is a no-op, so psz_data may still be NULL here if Demux never
 * loaded the file. */
224 free( p_sys->psz_prefix );
225 free( p_sys->psz_data );
/*
 * Demux: loads the whole playlist into memory on first use, then scans it
 * tag by tag starting at "<ASX". Playlist-level and per-entry metadata are
 * collected with StoreString, and a sub-item is added to p_current_input
 * for each <EntryRef> and for each closed <Entry>.
 *
 * Returns -1 if i_data_len is not positive after loading, and 0 at the end.
 *
 * NOTE(review): this listing omits many lines (braces, the declarations of
 * i_pos, i_strlen, i_starttime, i_duration, i_options, psz_tmp and
 * p_current_input, and a number of statements), so the control flow between
 * the visible statements is only partly visible.
 */
229 static int Demux( demux_t *p_demux )
231 demux_sys_t *p_sys = p_demux->p_sys;
232 char *psz_parse = NULL;
233 char *psz_backup = NULL;
234 bool b_entry = false;
235 input_item_t *p_input;
/* First call: i_data_len is still negative (Import_ASX sets it to -1), so
 * the file has not been read yet. */
239 if( p_sys->i_data_len < 0 )
242 p_sys->i_data_len = stream_Size( p_demux->s ) +1; /* This is a cheat to prevent unnecessary realloc */
/* NOTE(review): the second clause is always true when the first one holds,
 * so this only replaces a non-positive size with 1024; the 16384 bound has
 * no effect as written. */
243 if( p_sys->i_data_len <= 0 && p_sys->i_data_len < 16384 ) p_sys->i_data_len = 1024;
/* NOTE(review): no check of the malloc result is visible in this listing. */
244 p_sys->psz_data = malloc( p_sys->i_data_len * sizeof(char) +1);
246 /* load the complete file */
249 int i_read = stream_Read( p_demux->s, &p_sys->psz_data[i_pos], p_sys->i_data_len - i_pos );
/* NOTE(review): the terminator index ignores i_pos although the data was
 * read at offset i_pos; this is only correct while i_pos is 0 -- confirm
 * against the omitted lines. */
250 p_sys->psz_data[i_read] = '\0';
/* A short read means the stream delivered less than the remaining space. */
252 if( i_read < p_sys->i_data_len - i_pos ) break; /* Done */
/* Buffer was filled completely: grow it by 1024 and read again. */
255 p_sys->i_data_len += 1024;
/* NOTE(review): this uses sizeof( char * ) where the malloc above uses
 * sizeof(char), so it over-allocates; the realloc result also overwrites
 * psz_data directly, losing the old buffer if realloc fails. */
256 p_sys->psz_data = realloc( p_sys->psz_data, p_sys->i_data_len * sizeof( char * ) +1 );
258 if( p_sys->i_data_len <= 0 ) return -1;
261 psz_parse = p_sys->psz_data;
262 /* Find first element */
263 if( ( psz_parse = strcasestr( psz_parse, "<ASX" ) ) )
/* Scratch string reused by the PARAM and EntryRef branches. */
266 char *psz_string = NULL;
/* Playlist-level metadata, filled while b_entry is false. */
269 char *psz_base_asx = NULL;
270 char *psz_title_asx = NULL;
271 char *psz_artist_asx = NULL;
272 char *psz_copyright_asx = NULL;
273 char *psz_moreinfo_asx = NULL;
274 char *psz_abstract_asx = NULL;
/* Per-entry metadata, filled while b_entry is true and released when the
 * entry is closed. */
276 char *psz_base_entry = NULL;
277 char *psz_title_entry = NULL;
278 char *psz_artist_entry = NULL;
279 char *psz_copyright_entry = NULL;
280 char *psz_moreinfo_entry = NULL;
281 char *psz_abstract_entry = NULL;
282 int i_entry_count = 0;
283 bool b_skip_entry = false;
285 char *psz_href = NULL;
/* Move to the end of the opening <ASX ...> tag. */
289 psz_parse = strcasestr( psz_parse, ">" );
/* Main scan: each iteration jumps to the next '<' and dispatches on the tag
 * name, compared case-insensitively. The loop ends as soon as any search
 * leaves psz_parse NULL. */
291 while( psz_parse && ( psz_parse = strcasestr( psz_parse, "<" ) ) )
293 if( !strncasecmp( psz_parse, "<!--", 4 ) )
295 /* this is a comment */
296 if( ( psz_parse = strcasestr( psz_parse, "-->" ) ) )
/* <PARAM name="..." value="..."/>: a param named "encoding" whose value is
 * "utf-8" sets p_sys->b_utf8, which StoreString reads. */
300 else if( !strncasecmp( psz_parse, "<PARAM ", 7 ) )
302 bool b_encoding_flag = false;
/* (unsigned)-1 makes the skip effectively unbounded; it relies on the NUL
 * terminator written after the data was loaded. */
303 psz_parse = SkipBlanks(psz_parse+7, (unsigned)-1);
304 if( !strncasecmp( psz_parse, "name", 4 ) )
306 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
308 psz_backup = ++psz_parse;
309 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
/* psz_backup..psz_parse now delimits the quoted attribute value. */
311 i_strlen = psz_parse-psz_backup;
312 if( i_strlen < 1 ) continue;
313 msg_Dbg( p_demux, "param name strlen: %d", i_strlen);
/* NOTE(review): neither a NULL check nor the matching free of psz_string
 * is visible in this listing. */
314 psz_string = malloc( i_strlen *sizeof( char ) +1);
315 memcpy( psz_string, psz_backup, i_strlen );
316 psz_string[i_strlen] = '\0';
317 msg_Dbg( p_demux, "param name: %s", psz_string);
318 b_encoding_flag = !strcasecmp( psz_string, "encoding" );
326 if( !strncasecmp( psz_parse, "value", 5 ) )
328 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
330 psz_backup = ++psz_parse;
331 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
333 i_strlen = psz_parse-psz_backup;
334 if( i_strlen < 1 ) continue;
335 msg_Dbg( p_demux, "param value strlen: %d", i_strlen);
336 psz_string = malloc( i_strlen *sizeof( char ) +1);
337 memcpy( psz_string, psz_backup, i_strlen );
338 psz_string[i_strlen] = '\0';
339 msg_Dbg( p_demux, "param value: %s", psz_string);
340 if( b_encoding_flag && !strcasecmp( psz_string, "utf-8" ) ) p_sys->b_utf8 = true;
347 if( ( psz_parse = strcasestr( psz_parse, "/>" ) ) )
351 else if( !strncasecmp( psz_parse, "<BANNER", 7 ) )
353 /* We skip this element */
354 if( ( psz_parse = strcasestr( psz_parse, "</BANNER>" ) ) )
358 else if( !strncasecmp( psz_parse, "<PREVIEWDURATION", 16 ) ||
359 !strncasecmp( psz_parse, "<LOGURL", 7 ) ||
360 !strncasecmp( psz_parse, "<Skin", 5 ) )
362 /* We skip this element */
363 if( ( psz_parse = strcasestr( psz_parse, "/>" ) ) )
/* The metadata elements below are stored at entry level while inside an
 * <Entry> (b_entry true) and at playlist level otherwise. */
367 else if( !strncasecmp( psz_parse, "<BASE ", 6 ) )
369 psz_parse = SkipBlanks(psz_parse+6, (unsigned)-1);
370 if( !strncasecmp( psz_parse, "HREF", 4 ) )
372 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
374 psz_backup = ++psz_parse;
375 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
377 StoreString( p_demux, (b_entry ? &psz_base_entry : &psz_base_asx), psz_backup, psz_parse );
383 if( ( psz_parse = strcasestr( psz_parse, "/>" ) ) )
387 else if( !strncasecmp( psz_parse, "<TITLE>", 7 ) )
389 psz_backup = psz_parse+=7;
390 if( ( psz_parse = strcasestr( psz_parse, "</TITLE>" ) ) )
392 StoreString( p_demux, (b_entry ? &psz_title_entry : &psz_title_asx), psz_backup, psz_parse );
397 else if( !strncasecmp( psz_parse, "<Author>", 8 ) )
399 psz_backup = psz_parse+=8;
400 if( ( psz_parse = strcasestr( psz_parse, "</Author>" ) ) )
402 StoreString( p_demux, (b_entry ? &psz_artist_entry : &psz_artist_asx), psz_backup, psz_parse );
/* NOTE(review): only the 10 characters of "<Copyright" are matched, but the
 * pointer is advanced by 11, i.e. the following character is assumed to be
 * the closing '>' without being checked. */
407 else if( !strncasecmp( psz_parse, "<Copyright", 10 ) )
409 psz_backup = psz_parse+=11;
410 if( ( psz_parse = strcasestr( psz_parse, "</Copyright>" ) ) )
412 StoreString( p_demux, (b_entry ? &psz_copyright_entry : &psz_copyright_asx), psz_backup, psz_parse );
417 else if( !strncasecmp( psz_parse, "<MoreInfo ", 10 ) )
419 psz_parse = SkipBlanks(psz_parse+10, (unsigned)-1);
420 if( !strncasecmp( psz_parse, "HREF", 4 ) )
422 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
424 psz_backup = ++psz_parse;
425 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
427 StoreString( p_demux, (b_entry ? &psz_moreinfo_entry : &psz_moreinfo_asx), psz_backup, psz_parse );
433 if( ( psz_parse = strcasestr( psz_parse, "/>" ) ) )
437 else if( !strncasecmp( psz_parse, "<ABSTRACT>", 10 ) )
439 psz_backup = psz_parse+=10;
440 if( ( psz_parse = strcasestr( psz_parse, "</ABSTRACT>" ) ) )
442 StoreString( p_demux, (b_entry ? &psz_abstract_entry : &psz_abstract_asx), psz_backup, psz_parse );
/* <EntryRef HREF="..."/>: the quoted HREF becomes a new input item, named
 * after the playlist title, that is added as a sub-item of
 * p_current_input. */
447 else if( !strncasecmp( psz_parse, "<EntryRef ", 10 ) )
449 psz_parse = SkipBlanks(psz_parse+10, (unsigned)-1);
450 if( !strncasecmp( psz_parse, "HREF", 4 ) )
452 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
454 psz_backup = ++psz_parse;
455 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
457 i_strlen = psz_parse-psz_backup;
458 if( i_strlen < 1 ) continue;
459 psz_string = malloc( i_strlen*sizeof( char ) +1);
460 memcpy( psz_string, psz_backup, i_strlen );
461 psz_string[i_strlen] = '\0';
462 p_input = input_ItemNew( p_demux, psz_string, psz_title_asx );
463 input_ItemCopyOptions( p_current_input, p_input );
464 input_ItemAddSubItem( p_current_input, p_input );
471 if( ( psz_parse = strcasestr( psz_parse, "/>" ) ) )
/* </Entry>: turn the href and metadata collected since <Entry> into a
 * sub-item, then release the per-entry strings. */
475 else if( !strncasecmp( psz_parse, "</Entry>", 8 ) )
477 input_item_t *p_entry = NULL;
478 char *psz_name = NULL;
/* Room for the two options built below (start-time and stop-time). */
480 char * ppsz_options[2];
483 /* add a new entry */
487 msg_Err( p_demux, "end of entry without start?" );
493 msg_Err( p_demux, "entry without href?" );
/* Entries flagged by the <Entry> branch are only skipped when the
 * "playlist-skip-ads" setting read in Import_ASX is enabled. */
497 if( p_sys->b_skip_ads && b_skip_entry )
499 msg_Dbg( p_demux, "skipped entry %d %s (%s)",
500 i_entry_count, ( psz_title_entry ? psz_title_entry : p_current_input->psz_name ), psz_href );
504 if( i_starttime || i_duration )
/* NOTE(review): the asprintf return values are not checked in the visible
 * lines; on failure the contents of the output pointer are unspecified. */
507 asprintf(ppsz_options+i_options, ":start-time=%d", i_starttime);
/* The stop time is expressed as start time plus duration. */
511 asprintf(ppsz_options+i_options, ":stop-time=%d", i_starttime + i_duration);
516 /* create the new entry */
/* The item name is the entry counter followed by the entry title, falling
 * back to the name of p_current_input when the entry has no title. */
517 asprintf( &psz_name, "%d %s", i_entry_count, ( psz_title_entry ? psz_title_entry : p_current_input->psz_name ) );
519 p_entry = input_ItemNewExt( p_demux, psz_href, psz_name, i_options, (const char * const *)ppsz_options, -1 );
520 FREENULL( psz_name );
521 input_ItemCopyOptions( p_current_input, p_entry );
/* Pops the option strings one by one -- presumably inside a loop that frees
 * them; the surrounding lines are not visible. */
524 psz_name = ppsz_options[--i_options];
528 if( psz_title_entry ) input_item_SetTitle( p_entry, psz_title_entry );
529 if( psz_artist_entry ) input_item_SetArtist( p_entry, psz_artist_entry );
530 if( psz_copyright_entry ) input_item_SetCopyright( p_entry, psz_copyright_entry );
531 if( psz_moreinfo_entry ) input_item_SetURL( p_entry, psz_moreinfo_entry );
532 if( psz_abstract_entry ) input_item_SetDescription( p_entry, psz_abstract_entry );
533 input_ItemAddSubItem( p_current_input, p_entry );
534 vlc_gc_decref( p_entry );
/* Reset the per-entry state for the next <Entry>. */
538 FREENULL( psz_href );
539 FREENULL( psz_title_entry );
540 FREENULL( psz_base_entry );
541 FREENULL( psz_artist_entry );
542 FREENULL( psz_copyright_entry );
543 FREENULL( psz_moreinfo_entry );
544 FREENULL( psz_abstract_entry );
547 else if( !strncasecmp( psz_parse, "<Entry", 6 ) )
549 char *psz_clientskip;
553 msg_Err( p_demux, "We already are in an entry section" );
/* The search for the attribute starts at the tag and is not bounded by it;
 * the comparison below restricts a hit to this tag's own attributes. */
558 psz_clientskip = strcasestr( psz_parse, "clientskip=\"no\"" );
559 psz_parse = strcasestr( psz_parse, ">" );
561 /* If clientskip was enabled ... this is an ad */
/* NOTE(review): the literal matched above is clientskip="no", while the
 * comment above speaks of clientskip being enabled -- confirm the intended
 * meaning. Also, if no '>' was found psz_parse is NULL here and the pointer
 * comparison is made against NULL. */
562 b_skip_entry = (NULL != psz_clientskip) && (psz_clientskip < psz_parse);
564 // init entry details
570 else if( !strncasecmp( psz_parse, "<Ref ", 5 ) )
572 psz_parse = SkipBlanks(psz_parse+5, (unsigned)-1);
575 msg_Err( p_demux, "A ref outside an entry section" );
579 if( !strncasecmp( psz_parse, "HREF", 4 ) )
581 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
583 psz_backup = ++psz_parse;
/* Drop blanks at the start of the quoted URL. */
584 psz_backup = SkipBlanks(psz_backup, (unsigned)-1);
585 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
588 i_strlen = psz_parse-psz_backup;
589 if( i_strlen < 1 ) continue;
/* NOTE(review): whether a previous psz_href (several <Ref> in one entry) is
 * released before this assignment is not visible in this listing. */
592 psz_href = malloc( i_strlen*sizeof( char ) +1);
593 memcpy( psz_href, psz_backup, i_strlen );
594 psz_href[i_strlen] = '\0';
/* Walk backwards from the last character over trailing CR / LF. */
595 psz_tmp = psz_href + (i_strlen-1);
596 while( psz_tmp >= psz_href &&
597 ( *psz_tmp == '\r' || *psz_tmp == '\n' ) )
607 if( ( psz_parse = strcasestr( psz_parse, ">" ) ) )
611 else if( !strncasecmp( psz_parse, "<starttime ", 11 ) )
613 psz_parse = SkipBlanks(psz_parse+11, (unsigned)-1);
616 msg_Err( p_demux, "starttime outside an entry section" );
620 if( !strncasecmp( psz_parse, "value", 5 ) )
622 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
624 psz_backup = ++psz_parse;
625 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
627 i_strlen = psz_parse-psz_backup;
628 if( i_strlen < 1 ) continue;
630 i_starttime = ParseTime(psz_backup, i_strlen);
636 if( ( psz_parse = strcasestr( psz_parse, ">" ) ) )
/* NOTE(review): "<duration " is 10 characters long but 11 are compared, so
 * the literal's terminating NUL takes part in the comparison and a normal
 * tag such as <duration value="..."> cannot match. The following line also
 * advances by 5 rather than by the tag length. Compare with the
 * "<starttime " branch, where the literal really is 11 characters long. */
640 else if( !strncasecmp( psz_parse, "<duration ", 11 ) )
642 psz_parse = SkipBlanks(psz_parse+5, (unsigned)-1);
645 msg_Err( p_demux, "duration outside an entry section" );
649 if( !strncasecmp( psz_parse, "value", 5 ) )
651 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
653 psz_backup = ++psz_parse;
654 if( ( psz_parse = strcasestr( psz_parse, "\"" ) ) )
656 i_strlen = psz_parse-psz_backup;
657 if( i_strlen < 1 ) continue;
659 i_duration = ParseTime(psz_backup, i_strlen);
665 if( ( psz_parse = strcasestr( psz_parse, ">" ) ) )
/* </ASX: apply the playlist-level metadata to p_current_input, then release
 * the playlist-level strings. */
669 else if( !strncasecmp( psz_parse, "</ASX", 5 ) )
671 if( psz_title_asx ) input_item_SetTitle( p_current_input, psz_title_asx );
672 if( psz_artist_asx ) input_item_SetArtist( p_current_input, psz_artist_asx );
673 if( psz_copyright_asx ) input_item_SetCopyright( p_current_input, psz_copyright_asx );
674 if( psz_moreinfo_asx ) input_item_SetURL( p_current_input, psz_moreinfo_asx );
675 if( psz_abstract_asx ) input_item_SetDescription( p_current_input, psz_abstract_asx );
676 FREENULL( psz_base_asx );
677 FREENULL( psz_title_asx );
678 FREENULL( psz_artist_asx );
679 FREENULL( psz_copyright_asx );
680 FREENULL( psz_moreinfo_asx );
681 FREENULL( psz_abstract_asx );
687 /* FIXME Unsupported elements */
/* HANDLE_PLAY_AND_RELEASE is a macro defined outside this listing. */
695 HANDLE_PLAY_AND_RELEASE;
696 return 0; /* Needed for correct operation of go back */
699 static int Control( demux_t *p_demux, int i_query, va_list args )
701 VLC_UNUSED(p_demux); VLC_UNUSED(i_query); VLC_UNUSED(args);