#ifndef __VLC_URL_H
# define __VLC_URL_H
-typedef struct
+struct vlc_url_t
{
char *psz_protocol;
char *psz_username;
char *psz_option;
char *psz_buffer; /* to be freed */
-} vlc_url_t;
+};
+
+VLC_EXPORT( char *, unescape_URI_duplicate, ( const char *psz ) );
+VLC_EXPORT( void, unescape_URI, ( char *psz ) );
+VLC_EXPORT( char *, decode_URI_duplicate, ( const char *psz ) );
+VLC_EXPORT( void, decode_URI, ( char *psz ) );
+VLC_EXPORT( char *, encode_URI_component, ( const char *psz ) );
/*****************************************************************************
* vlc_UrlParse:
char *psz_dup;
char *psz_parse;
char *p;
+ char *p2;
url->psz_protocol = NULL;
url->psz_username = NULL;
}
url->psz_buffer = psz_parse = psz_dup = strdup( psz_url );
+ /* Search a valid protocol */
p = strstr( psz_parse, ":/" );
+ if( p != NULL )
+ {
+ char *p2;
+ for( p2 = psz_parse; p2 < p; p2++ )
+ {
+#define I(i,a,b) ( (a) <= (i) && (i) <= (b) )
+ if( !I(*p2, 'a', 'z' ) && !I(*p2, 'A', 'Z') && !I(*p2, '0', '9') && *p2 != '+' && *p2 != '-' && *p2 != '.' )
+ {
+ p = NULL;
+ break;
+ }
+#undef I
+ }
+ }
+
if( p != NULL )
{
/* we have a protocol */
psz_parse = p;
}
p = strchr( psz_parse, '@' );
- if( p != NULL )
+ p2 = strchr( psz_parse, '/' );
+ if( p != NULL && ( p2 != NULL ? p < p2 : 1 ) )
{
/* We have a login */
url->psz_username = psz_parse;
/* We have a password */
*psz_parse++ = '\0';
url->psz_password = psz_parse;
+ decode_URI( url->psz_password );
}
-
+ decode_URI( url->psz_username );
psz_parse = p;
}
/*****************************************************************************
* vlc_UrlClean:
- *****************************************************************************
- *
*****************************************************************************/
static inline void vlc_UrlClean( vlc_url_t *url )
{
- if( url->psz_buffer ) free( url->psz_buffer );
- if( url->psz_host ) free( url->psz_host );
+ free( url->psz_buffer );
+ free( url->psz_host );
url->psz_protocol = NULL;
url->psz_username = NULL;
url->psz_buffer = NULL;
}
-static inline int isurlsafe( int c )
-{
- return ( (unsigned char)( c - 'a' ) < 26 )
- || ( (unsigned char)( c - 'A' ) < 26 )
- || ( (unsigned char)( c - '0' ) < 10 )
- || ( (unsigned char)( c ) > 127 )
- /* Hmm, we should not encode character that are allowed in URLs
- * (even if they are not URL-safe), nor URL-safe characters.
- * We still encode some of them because of Microsoft's crap browser.
- */
- || ( strchr( "-_.", c ) != NULL );
-}
-static inline char url_hexchar( int c )
-{
- return ( c < 10 ) ? c + '0' : c + 'A' - 10;
-}
-
-/*****************************************************************************
- * vlc_UrlEncode:
- *****************************************************************************
- * perform URL encoding
- * (you do NOT want to do URL decoding - it is not reversible - do NOT do it)
- *****************************************************************************/
static inline char *vlc_UrlEncode( const char *psz_url )
{
- char psz_enc[3 * strlen( psz_url ) + 1], *out = psz_enc;
- const unsigned char *in;
-
- for( in = (const unsigned char *)psz_url; *in; in++ )
- {
- unsigned char c = *in;
-
- if( isurlsafe( c ) )
- *out++ = (char)c;
- else
- {
- uint16_t cp;
-
- *out++ = '%';
- /* UTF-8 to UCS-2 conversion */
- if( ( c & 0x7f ) == 0 )
- cp = c;
- else
- if( ( c & 0xe0 ) == 0xc0 )
- {
- cp = ((c & 0x1f) << 6) | (in[1] & 0x3f);
- in++;
- }
- else
- if( ( c & 0xf0 ) == 0xe0 )
- {
- cp = ((c & 0xf) << 12) | ((in[1] & 0x3f) << 6) | (in[2] & 0x3f);
- in += 2;
- }
- else
- /* cannot URL-encode code points outside the BMP */
- return NULL;
-
- if( cp < 0xff )
- {
- /* Encode ISO-8859-1 characters */
- *out++ = url_hexchar( cp >> 4 );
- *out++ = url_hexchar( cp & 0xf );
- }
- else
- {
- /* Encode non-Latin-1 characters */
- *out++ = 'u';
- *out++ = url_hexchar( cp >> 12 );
- *out++ = url_hexchar((cp >> 8) & 0xf );
- *out++ = url_hexchar((cp >> 4) & 0xf );
- *out++ = url_hexchar( cp & 0xf );
- }
- }
- }
- *out++ = '\0';
-
- return strdup( psz_enc );
+ /* FIXME: do not encode / : ? and & _when_ not needed */
+ return encode_URI_component( psz_url );
}
-/*****************************************************************************
- * vlc_UrlIsNotEncoded:
- *****************************************************************************
- * check if given string is not a valid URL and must hence be encoded
- *****************************************************************************/
#include <ctype.h>
+/** Check whether a given string is not a valid URL and must hence be
+ * encoded */
static inline int vlc_UrlIsNotEncoded( const char *psz_url )
{
const char *ptr;
ptr += 2;
}
else
- if( !isurlsafe( c ) )
+ if( ( (unsigned char)( c - 'a' ) < 26 )
+ || ( (unsigned char)( c - 'A' ) < 26 )
+ || ( (unsigned char)( c - '0' ) < 10 )
+ || ( strchr( "-_.", c ) != NULL ) )
return 1;
}
return 0; /* looks fine - but maybe it is not encoded */
}
-/*****************************************************************************
- * vlc_b64_encode:
- *****************************************************************************
- *
- *****************************************************************************/
-static inline char *vlc_b64_encode( char *src )
-{
- static const char b64[] =
- "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/";
- size_t len = strlen( src );
-
- char *ret;
- char *dst = (char *)malloc( ( len + 4 ) * 4 / 3 );
- if( dst == NULL )
- return NULL;
-
- ret = dst;
-
- while( len > 0 )
- {
- /* pops (up to) 3 bytes of input */
- uint32_t v = *src++ << 24;
- if( len >= 2 )
- {
- v |= *src++ << 16;
- if( len >= 3 )
- v |= *src++ << 8;
- }
-
- /* pushes (up to) 4 bytes of output */
- while( v )
- {
- *dst++ = b64[v >> 26];
- v = v << 6;
- }
-
- switch( len )
- {
- case 1:
- *dst++ = '=';
- *dst++ = '=';
- len--;
- break;
-
- case 2:
- *dst++ = '=';
- len -= 2;
- break;
-
- default:
- len -= 3;
- }
- }
-
- *dst = '\0';
-
- return ret;
-}
#endif