+/*****************************************************************************
+ * utf8.c: Test for UTF-8 encoding/decoding stuff
+ *****************************************************************************
+ * Copyright (C) 2006 Rémi Denis-Courmont
+ * $Id$
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; either version 2 of the License, or
+ * (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston MA 02110-1301, USA.
+ *****************************************************************************/
+
+#include <vlc/vlc.h>
+#include "vlc_charset.h"
+
+#include <stdbool.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+
+/**
+ * Runs IsUTF8() and EnsureUTF8() on one input and checks the outcome.
+ *
+ * The input is treated as valid exactly when it compares equal to the
+ * expected output. Each check that fails prints a message on stdout and
+ * terminates the process with its own exit status (1 to 4).
+ *
+ * @param in  string handed to IsUTF8() and, through a private copy, to
+ *            EnsureUTF8()
+ * @param out content the copy is expected to have after EnsureUTF8()
+ */
+static void test (const char *in, const char *out)
+{
+    /* No rewriting expected <=> the input is expected to be accepted. */
+    const bool expect_valid = (strcmp (in, out) == 0);
+
+    /* EnsureUTF8() is given a writable copy; the literal stays untouched. */
+    char *copy = strdup (in);
+    if (copy == NULL)
+        abort ();
+
+    if (!expect_valid)
+        printf ("\"%s\" should be rewritten as \"%s\"...\n", in, out);
+    else
+        printf ("\"%s\" should be accepted...\n", in);
+
+    /* Check 1: IsUTF8() must return non-NULL only for expected-valid input. */
+    const bool accepted = (IsUTF8 (in) != NULL);
+    if (accepted != expect_valid)
+    {
+        printf (" ERROR: IsUTF8 (%s) failed\n", in);
+        exit (1);
+    }
+
+    /* Check 2: same expectation for the return value of EnsureUTF8(). */
+    const bool kept = (EnsureUTF8 (copy) != NULL);
+    if (kept != expect_valid)
+    {
+        printf (" ERROR: EnsureUTF8 (%s) failed\n", in);
+        exit (2);
+    }
+
+    /* Check 3: after the call, the copy must match the expected output. */
+    if (strcmp (copy, out) != 0)
+    {
+        printf (" ERROR: got \"%s\"\n", copy);
+        exit (3);
+    }
+
+    /* Check 4: a second pass over the result must succeed, and IsUTF8()
+     * must accept it (IsUTF8() is only reached if EnsureUTF8() succeeded). */
+    if (!(EnsureUTF8 (copy) != NULL && IsUTF8 (copy) != NULL))
+    {
+        printf (" ERROR: EnsureUTF8 (%s) is not UTF-8\n", in);
+        exit (4);
+    }
+
+    free (copy);
+}
+
+/**
+ * Test driver: feeds a fixed list of input/expected-output pairs to test().
+ *
+ * @return 0 once every pair has been checked; test() exits the process
+ *         itself with a non-zero status on the first failure.
+ */
+int main (void)
+{
+    /* Pairs are run in the order listed. */
+    static const struct
+    {
+        const char *in;   /* string to check */
+        const char *out;  /* expected content after EnsureUTF8() */
+    } cases[] = {
+        { "", "" },
+
+        { "this_should_not_be_modified_1234",
+          "this_should_not_be_modified_1234" },
+
+        /* invalid byte */
+        { "\xFF", "?" },
+        /* BOM */
+        { "\xEF\xBB\xBFHello", "\xEF\xBB\xBFHello" },
+        /* no conversion past end of string */
+        { "\x00\xE9", "" },
+
+        { "T\xC3\xA9l\xC3\xA9vision \xE2\x82\xAC", "Télévision €" },
+        { "T\xE9l\xE9vision", "T?l?vision" },
+        /* overlong */
+        { "\xC1\x94\xC3\xa9l\xC3\xA9vision", "??élévision" },
+
+        /* more overlong */
+        { "Hel\xF0\x83\x85\x87lo", "Hel????lo" },
+    };
+
+    /* Unbuffered stdout, so progress lines appear as soon as printed. */
+    (void)setvbuf (stdout, NULL, _IONBF, 0);
+
+    for (size_t i = 0; i < sizeof (cases) / sizeof (cases[0]); i++)
+        test (cases[i].in, cases[i].out);
+
+    return 0;
+}