1 /*****************************************************************************
2 * xurl.c: URL manipulation functions
3 *****************************************************************************
4 * Copyright (C) 2003-2004 Commonwealth Scientific and Industrial Research
5 * Organisation (CSIRO) Australia
6 * Copyright (C) 2004 the VideoLAN team
10 * Authors: Andre Pang <Andre.Pang@csiro.au>
12 * This program is free software; you can redistribute it and/or modify
13 * it under the terms of the GNU General Public License as published by
14 * the Free Software Foundation; either version 2 of the License, or
15 * (at your option) any later version.
17 * This program is distributed in the hope that it will be useful,
18 * but WITHOUT ANY WARRANTY; without even the implied warranty of
19 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
20 * GNU General Public License for more details.
22 * You should have received a copy of the GNU General Public License
23 * along with this program; if not, write to the Free Software
24 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston MA 02110-1301, USA.
25 *****************************************************************************/
32 static char *streallocat( char *psz_string, char *psz_to_append );
35 static char *xurl_strdup( const char *psz_string );
37 #define xurl_strdup strdup
40 static char *XURL_FindHostname ( char *psz_url );
41 static char *XURL_FindPath ( char *psz_url );
42 static char *XURL_FindFragment ( char *psz_url );
/*
 * Joins two URLs, using whichever one is absolute as the base.
 *
 * If psz_url1 is absolute, psz_url2 is concatenated onto it; otherwise
 * psz_url1 is concatenated onto psz_url2.  The result is whatever
 * XURL_Concat() returns for the chosen (base, appended) pair.
 */
char *XURL_Join( char *psz_url1, char *psz_url2 )
{
    return XURL_IsAbsolute( psz_url1 )
        ? XURL_Concat( psz_url1, psz_url2 )
        : XURL_Concat( psz_url2, psz_url1 );
}
55 /* TODO: replace XURL_Concat's rel/absolute calculation with the one
56 * specified by RFC2396, and also test it on their test suite :) */
59 char *XURL_Concat( char *psz_url, char *psz_append )
61 char *psz_return_value = NULL;
63 if( XURL_IsAbsolute( psz_append ) == XURL_TRUE )
64 return strdup( psz_append );
66 if( XURL_IsAbsolute( psz_url ) )
68 if( XURL_HasAbsolutePath( psz_append ) )
72 psz_concat_url = XURL_GetSchemeAndHostname( psz_url );
74 psz_concat_url = streallocat( psz_concat_url, psz_append );
76 fprintf( stderr, "XURL_Concat: concat is \"%s\"\n",
79 psz_return_value = psz_concat_url;
83 /* psz_append is a relative URL */
86 /* strip off last path component */
87 psz_new_url = XURL_GetHead( psz_url );
88 psz_new_url = streallocat( psz_new_url, psz_append );
90 psz_return_value = psz_new_url;
95 /* not an absolute URL */
96 if( XURL_HasAbsolutePath( psz_append ) == XURL_FALSE )
98 char *psz_new_url = XURL_GetHead( psz_url );
100 psz_new_url = streallocat( psz_new_url, psz_append );
101 psz_return_value = psz_new_url;
105 /* URL to append has an absolute path -- just use that instead */
106 psz_return_value = xurl_strdup( psz_append );
110 return psz_return_value;
114 XURL_Bool XURL_IsAbsolute( char *psz_url )
116 if( XURL_FindHostname( psz_url ) == NULL )
119 fprintf( stderr, "XURL_IsAbsolute(%s) returning false\n", psz_url );
126 fprintf( stderr, "XURL_IsAbsolute(%s) returning true\n", psz_url );
133 XURL_Bool XURL_HasFragment( char *psz_url )
135 if( XURL_FindFragment( psz_url ) == NULL )
/*
 * Locates the start of the hostname inside psz_url.
 *
 * The hostname is taken to begin right after the first "://".  The returned
 * pointer points into psz_url itself (nothing is allocated).  Returns NULL
 * when psz_url is NULL, contains no "://", or has nothing after it.
 */
char *XURL_FindHostname( char *psz_url )
{
    char *psz_return_value = NULL;
    char *psz_scheme_separator;

    if( psz_url == NULL )
        return NULL;

    psz_scheme_separator = strstr( psz_url, "://" );
    if( psz_scheme_separator != NULL )
    {
        char *psz_hostname = psz_scheme_separator + strlen( "://" );
        if( *psz_hostname != '\0' )
            psz_return_value = psz_hostname;

        /* NOTE(review): the guard macro name is reconstructed -- confirm.
         * A NULL result must not be handed to "%s" directly. */
#ifdef XURL_DEBUG
        fprintf( stderr, "XURL_FindHostname(%s): returning \"%s\"\n",
                 psz_url, psz_return_value ? psz_return_value : "(null)" );
#endif
    }

    return psz_return_value;
}
162 XURL_Bool XURL_HasAbsolutePath( char *psz_url )
164 #ifdef XURL_WIN32_PATHING
165 if( psz_url[0] == '/' || psz_url[0] == '\\' )
167 if( psz_url[0] == '/' )
/*
 * Returns a newly allocated copy of the hostname part of psz_url.
 *
 * The hostname starts where XURL_FindHostname() says it does and runs up to
 * (not including) the next '/', or to the end of the string if there is
 * none.  Returns NULL if no hostname is found or if allocation fails.
 * The result is allocated with xurl_malloc().
 */
char *XURL_GetHostname( char *psz_url )
{
    char *psz_hostname = XURL_FindHostname( psz_url );
    char *psz_one_past_end_of_hostname;
    char *psz_new_hostname;
    size_t i_hostname_length;

    if( psz_hostname == NULL )
    {
        /* Didn't find a hostname */
        return NULL;
    }

    psz_one_past_end_of_hostname = strchr( psz_hostname, '/' );
    if( psz_one_past_end_of_hostname != NULL )
    {
        /* Found a '/' after the hostname: the hostname is everything
         * between its start and that '/' */
        i_hostname_length =
            (size_t)( psz_one_past_end_of_hostname - psz_hostname );
    }
    else
    {
        /* Didn't find a '/': the hostname runs to the end of the string */
        i_hostname_length = strlen( psz_hostname );
    }

    /* +1 for the terminating '\0', which must be written explicitly */
    psz_new_hostname = xurl_malloc( i_hostname_length + 1 );
    if( psz_new_hostname == NULL )
        return NULL;
    memcpy( psz_new_hostname, psz_hostname, i_hostname_length );
    psz_new_hostname[i_hostname_length] = '\0';

    /* NOTE(review): the guard macro name is reconstructed -- confirm */
#ifdef XURL_DEBUG
    fprintf (stderr, "XURL_GetHostname: psz_new_hostname is \"%s\"\n",
             psz_new_hostname );
#endif

    return psz_new_hostname;
}
/*
 * Returns a newly allocated "scheme://hostname" string built from psz_url.
 *
 * The scheme comes from XURL_GetScheme() and the hostname from
 * XURL_GetHostname(); both temporaries are released before returning.
 * Returns NULL if either part is unavailable or if allocation fails.
 */
char *XURL_GetSchemeAndHostname( char *psz_url )
{
    char *psz_scheme;
    char *psz_hostname;
    char *psz_scheme_and_hostname = NULL;

    psz_scheme = XURL_GetScheme( psz_url );
    if( psz_scheme == NULL )
        return NULL;

    psz_hostname = XURL_GetHostname( psz_url );
    if( psz_hostname != NULL )
    {
        /* malloc +1 for the terminating '\0' */
        psz_scheme_and_hostname = xurl_malloc(
                strlen( psz_scheme ) + strlen( "://" ) +
                strlen( psz_hostname ) + 1 );
        if( psz_scheme_and_hostname != NULL )
        {
            (void) strcpy( psz_scheme_and_hostname, psz_scheme );
            (void) strcat( psz_scheme_and_hostname, "://" );
            (void) strcat( psz_scheme_and_hostname, psz_hostname );
        }

        xurl_free( psz_hostname );
    }

    /* the scheme copy is only needed to build the result */
    xurl_free( psz_scheme );

    return psz_scheme_and_hostname;
}
/*
 * Locates the fragment of psz_url: returns a pointer to the first '#' in
 * the string (pointing into psz_url itself), or NULL if there is none.
 */
char *XURL_FindFragment( char *psz_url )
{
    return strchr( psz_url, '#' );
}
/*
 * Locates the query of psz_url: returns a pointer to the first '?' in the
 * string (pointing into psz_url itself), or NULL if there is none.
 */
char *XURL_FindQuery( char *psz_url )
{
    return strchr( psz_url, '?' );
}
275 char *XURL_GetScheme( char *psz_url )
278 size_t i_scheme_length;
281 if( XURL_IsAbsolute( psz_url ) == XURL_FALSE ) return strdup( "file" );
283 /* this strchr will always succeed since we have an absolute URL, and thus
285 psz_colon = strchr( psz_url, ':' );
287 i_scheme_length = psz_colon - psz_url;
289 new_scheme = xurl_malloc( i_scheme_length );
290 if( new_scheme == NULL ) return NULL;
292 strncpy( new_scheme, psz_url, i_scheme_length );
298 XURL_Bool XURL_IsFileURL( char *psz_url )
300 XURL_Bool b_return_value;
301 char *psz_scheme = XURL_GetScheme( psz_url );
303 if( strcasecmp( psz_scheme, "file" ) == 0 )
304 b_return_value = XURL_TRUE;
306 b_return_value = XURL_FALSE;
308 xurl_free( psz_scheme );
310 return b_return_value;
/*
 * Duplicates psz_string into storage obtained from xurl_malloc().
 * Returns NULL when psz_string is NULL or when allocation fails.
 *
 * NOTE(review): the file also contains "#define xurl_strdup strdup";
 * presumably this definition is only compiled when that macro is not in
 * effect -- confirm the surrounding conditional.
 */
char *xurl_strdup( const char *psz_string )
{
    size_t i_bytes;
    char *psz_copy;

    if( psz_string == NULL )
        return NULL;

    /* copy the terminating '\0' along with the characters */
    i_bytes = strlen( psz_string ) + 1;
    psz_copy = xurl_malloc( i_bytes );
    if( psz_copy != NULL )
        memcpy( psz_copy, psz_string, i_bytes );

    return psz_copy;
}
333 char *XURL_FindPath( char *psz_url )
335 char *psz_return_value = NULL;
337 if( XURL_IsAbsolute( psz_url ) == XURL_TRUE )
339 char *psz_start_of_hostname = XURL_FindHostname( psz_url );
340 if( psz_start_of_hostname != NULL )
342 char *psz_start_of_path = strchr( psz_start_of_hostname, '/' );
343 psz_return_value = psz_start_of_path;
348 if( XURL_HasAbsolutePath( psz_url ) == XURL_TRUE )
350 psz_return_value = psz_url;
354 return xurl_strdup (".");
358 return psz_return_value;
/*
 * Returns a newly allocated copy of the path of psz_url, with any query
 * ("?...") and fragment ("#...") removed.
 *
 * The path is located with XURL_FindPath() and duplicated; the copy is then
 * cut at the first '?' and at the first '#'.  Returns NULL if no path is
 * found or if the copy cannot be allocated.
 */
char *XURL_GetPath( char *psz_url )
{
    char *psz_found_path;
    char *psz_path;
    char *pc_question_mark;
    char *pc_fragment;

    /* XURL_FindPath() may yield NULL (e.g. absolute URL without a '/') */
    psz_found_path = XURL_FindPath( psz_url );
    if( psz_found_path == NULL )
        return NULL;

    psz_path = xurl_strdup( psz_found_path );
    if( psz_path == NULL )
        return NULL;

    /* NOTE(review): the guard macro name for the traces in this function
     * is reconstructed -- confirm against the rest of the file */
#ifdef XURL_DEBUG
    fprintf( stderr, "XURL_GetPath: XURL_FindPath returning \"%s\"\n",
             psz_path );
#endif

    /* drop the query, if any */
    pc_question_mark = XURL_FindQuery( psz_path );
    if( pc_question_mark != NULL )
        *pc_question_mark = '\0';

    /* drop the fragment, if any */
    pc_fragment = XURL_FindFragment( psz_path );
    if( pc_fragment != NULL )
    {
#ifdef XURL_DEBUG
        fprintf( stderr, "XURL_GetPath: XURL_FindFragment returned \"%s\"\n",
                 pc_fragment );
#endif
        *pc_fragment = '\0';
    }

#ifdef XURL_DEBUG
    fprintf( stderr, "XURL_GetPath returning \"%s\"\n", psz_path );
#endif

    return psz_path;
}
/*
 * Returns a newly allocated copy of psz_path with its last component
 * removed and a single trailing '/' appended.
 *
 * Everything from the last separator onwards is dropped; if psz_path has no
 * separator the whole string is kept.  With XURL_WIN32_PATHING defined a
 * '\\' is looked for first, then '/'.  Returns NULL if psz_path is NULL or
 * if allocation fails.
 *
 * NOTE(review): for a path with no separator this yields "name/" rather
 * than an empty head; that matches the previous behaviour -- confirm it is
 * what callers want.
 */
char *XURL_GetHead( const char *psz_path )
{
    const char *pc_last_slash;
    size_t i_head_length;
    char *psz_path_head;

    if( psz_path == NULL )
        return NULL;

    /* kill everything up to the last / (including the /) */
#ifdef XURL_WIN32_PATHING
    /* Windows: Try looking for a \ first; if we don't find one, look for / */
    pc_last_slash = strrchr( psz_path, '\\' );
    if( pc_last_slash == NULL )
        pc_last_slash = strrchr( psz_path, '/' );
#else
    pc_last_slash = strrchr( psz_path, '/' );
#endif

    if( pc_last_slash == NULL )
        i_head_length = strlen( psz_path );
    else
        i_head_length = (size_t)( pc_last_slash - psz_path );

    /* room for the head, the trailing '/' and the terminating '\0';
     * built in one allocation so no reallocated pointer can be lost */
    psz_path_head = malloc( i_head_length + 2 );
    if( psz_path_head == NULL )
        return NULL;

    memcpy( psz_path_head, psz_path, i_head_length );
    psz_path_head[i_head_length] = '/';
    psz_path_head[i_head_length + 1] = '\0';

    return psz_path_head;
}
/*
 * Returns a newly allocated copy of psz_url with its fragment removed.
 *
 * If XURL_FindFragment() finds nothing, the whole URL is duplicated;
 * otherwise only the characters before the fragment are copied.
 * Returns NULL if allocation fails.
 */
char *XURL_GetWithoutFragment( char *psz_url )
{
    char *pc_hash;
    char *psz_copy;
    size_t i_prefix_length;

    pc_hash = XURL_FindFragment( psz_url );
    if( pc_hash == NULL )
        return xurl_strdup( psz_url );

    /* number of characters that precede the fragment */
    i_prefix_length = pc_hash - psz_url;

    psz_copy = xurl_malloc( i_prefix_length + 1 );
    if( psz_copy == NULL )
        return NULL;

    memcpy( psz_copy, psz_url, i_prefix_length );
    psz_copy[i_prefix_length] = '\0';

    return psz_copy;
}
/*
 * Appends psz_to_append to the heap-allocated string psz_string, growing
 * the allocation with realloc(), and returns the resulting string.
 *
 * The caller must use the returned pointer in place of psz_string, since
 * realloc() may move the block.
 *
 *  - psz_string NULL:    returns NULL (nothing to append to)
 *  - psz_to_append NULL: returns psz_string unchanged
 *  - realloc() failure:  psz_string is freed and NULL is returned, so that
 *                        callers of the form "p = streallocat( p, s )" do
 *                        not leak the original block
 */
char *streallocat( char *psz_string, char *psz_to_append )
{
    size_t i_old_length;
    size_t i_append_length;
    char *psz_grown;

    if( psz_string == NULL )
        return NULL;
    if( psz_to_append == NULL )
        return psz_string;

    i_old_length = strlen( psz_string );
    i_append_length = strlen( psz_to_append );

    psz_grown = realloc( psz_string, i_old_length + i_append_length + 1 );
    if( psz_grown == NULL )
    {
        /* realloc() leaves the original block allocated on failure */
        free( psz_string );
        return NULL;
    }

    /* copy the appended text together with its terminating '\0' */
    memcpy( psz_grown + i_old_length, psz_to_append, i_append_length + 1 );

    return psz_grown;
}