mirror of
https://gitlab.gnome.org/GNOME/glib.git
synced 2025-01-06 04:46:16 +01:00
22cd18500d
Spotted when temporarily compiling with -Wwrite-strings. This only goes a small way towards making the code base -Wwrite-strings–clean. It introduces no functional changes, and fixes no bugs. Signed-off-by: Philip Withnall <withnall@endlessm.com> Reviewed-by: nobody
958 lines
27 KiB
C
958 lines
27 KiB
C
/* GLIB - Library of useful routines for C programming
 * Copyright (C) 1995-1997 Peter Mattis, Spencer Kimball and Josh MacDonald
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
 */
|
|
|
|
/*
 * Modified by the GLib Team and others 1997-2000. See the AUTHORS
 * file for a list of people on the GLib Team. See the ChangeLog
 * files for a list of changes. These files are distributed with
 * GLib at ftp://ftp.gtk.org/pub/gtk/.
 */
|
|
|
|
#undef G_DISABLE_ASSERT
|
|
#undef G_LOG_DOMAIN
|
|
|
|
#include <locale.h>
|
|
#include <string.h>
|
|
|
|
#include <glib.h>
|
|
|
|
/* Bug 311337 */
|
|
static void
|
|
test_iconv_state (void)
|
|
{
|
|
const gchar *in = "\xf4\xe5\xf8\xe5\xed";
|
|
const gchar *expected = "\xd7\xa4\xd7\x95\xd7\xa8\xd7\x95\xd7\x9d";
|
|
gchar *out;
|
|
gsize bytes_read = 0;
|
|
gsize bytes_written = 0;
|
|
GError *error = NULL;
|
|
|
|
out = g_convert (in, -1, "UTF-8", "CP1255",
|
|
&bytes_read, &bytes_written, &error);
|
|
|
|
if (error && error->code == G_CONVERT_ERROR_NO_CONVERSION)
|
|
return; /* silently skip if CP1255 is not supported, see bug 467707 */
|
|
|
|
g_assert_no_error (error);
|
|
g_assert_cmpint (bytes_read, ==, 5);
|
|
g_assert_cmpint (bytes_written, ==, 10);
|
|
g_assert_cmpstr (out, ==, expected);
|
|
g_free (out);
|
|
}
|
|
|
|
/* Some tests involving "vulgar fraction one half" (U+00BD). This is
|
|
* represented in UTF-8 as \xC2\xBD, in ISO-8859-1 as \xBD, and is not
|
|
* represented in ISO-8859-15. */
|
|
static void
|
|
test_one_half (void)
|
|
{
|
|
const gchar *in_utf8 = "\xc2\xbd";
|
|
gchar *out;
|
|
gsize bytes_read = 0;
|
|
gsize bytes_written = 0;
|
|
GError *error = NULL;
|
|
|
|
out = g_convert (in_utf8, -1,
|
|
"ISO-8859-1", "UTF-8",
|
|
&bytes_read, &bytes_written,
|
|
&error);
|
|
|
|
g_assert_no_error (error);
|
|
g_assert_cmpint (bytes_read, ==, 2);
|
|
g_assert_cmpint (bytes_written, ==, 1);
|
|
g_assert_cmpstr (out, ==, "\xbd");
|
|
g_free (out);
|
|
|
|
out = g_convert (in_utf8, -1,
|
|
"ISO-8859-15", "UTF-8",
|
|
&bytes_read, &bytes_written,
|
|
&error);
|
|
|
|
g_assert_error (error, G_CONVERT_ERROR, G_CONVERT_ERROR_ILLEGAL_SEQUENCE);
|
|
g_assert_cmpint (bytes_read, ==, 0);
|
|
g_assert_cmpint (bytes_written, ==, 0);
|
|
g_assert_cmpstr (out, ==, NULL);
|
|
g_clear_error (&error);
|
|
g_free (out);
|
|
|
|
out = g_convert_with_fallback (in_utf8, -1,
|
|
"ISO8859-15", "UTF-8",
|
|
"a",
|
|
&bytes_read, &bytes_written,
|
|
&error);
|
|
|
|
g_assert_no_error (error);
|
|
g_assert_cmpint (bytes_read, ==, 2);
|
|
g_assert_cmpint (bytes_written, ==, 1);
|
|
g_assert_cmpstr (out, ==, "a");
|
|
g_free (out);
|
|
}
|
|
|
|
static void
|
|
test_byte_order (void)
|
|
{
|
|
gchar in_be[4] = { 0xfe, 0xff, 0x03, 0x93}; /* capital gamma */
|
|
gchar in_le[4] = { 0xff, 0xfe, 0x93, 0x03};
|
|
const gchar *expected = "\xce\x93";
|
|
gchar *out;
|
|
gsize bytes_read = 0;
|
|
gsize bytes_written = 0;
|
|
GError *error = NULL;
|
|
|
|
out = g_convert (in_be, sizeof (in_be),
|
|
"UTF-8", "UTF-16",
|
|
&bytes_read, &bytes_written,
|
|
&error);
|
|
|
|
g_assert_no_error (error);
|
|
g_assert_cmpint (bytes_read, ==, 4);
|
|
g_assert_cmpint (bytes_written, ==, 2);
|
|
g_assert_cmpstr (out, ==, expected);
|
|
g_free (out);
|
|
|
|
out = g_convert (in_le, sizeof (in_le),
|
|
"UTF-8", "UTF-16",
|
|
&bytes_read, &bytes_written,
|
|
&error);
|
|
|
|
g_assert_no_error (error);
|
|
g_assert_cmpint (bytes_read, ==, 4);
|
|
g_assert_cmpint (bytes_written, ==, 2);
|
|
g_assert_cmpstr (out, ==, expected);
|
|
g_free (out);
|
|
}
|
|
|
|
static void
|
|
check_utf8_to_ucs4 (const char *utf8,
|
|
glong utf8_len,
|
|
const gunichar *ucs4,
|
|
glong ucs4_len,
|
|
glong error_pos)
|
|
{
|
|
gunichar *result, *result2, *result3;
|
|
glong items_read, items_read2;
|
|
glong items_written, items_written2;
|
|
GError *error, *error2, *error3;
|
|
gint i;
|
|
|
|
if (!error_pos)
|
|
{
|
|
/* check the fast conversion */
|
|
result = g_utf8_to_ucs4_fast (utf8, utf8_len, &items_written);
|
|
|
|
g_assert_cmpint (items_written, ==, ucs4_len);
|
|
g_assert (result);
|
|
for (i = 0; i <= items_written; i++)
|
|
g_assert (result[i] == ucs4[i]);
|
|
|
|
g_free (result);
|
|
}
|
|
|
|
error = NULL;
|
|
result = g_utf8_to_ucs4 (utf8, utf8_len, &items_read, &items_written, &error);
|
|
|
|
if (utf8_len == strlen (utf8))
|
|
{
|
|
/* check that len == -1 yields identical results */
|
|
error2 = NULL;
|
|
result2 = g_utf8_to_ucs4 (utf8, -1, &items_read2, &items_written2, &error2);
|
|
g_assert (error || items_read2 == items_read);
|
|
g_assert (error || items_written2 == items_written);
|
|
g_assert_cmpint (!!result, ==, !!result2);
|
|
g_assert_cmpint (!!error, ==, !!error2);
|
|
if (result)
|
|
for (i = 0; i <= items_written; i++)
|
|
g_assert (result[i] == result2[i]);
|
|
|
|
g_free (result2);
|
|
if (error2)
|
|
g_error_free (error2);
|
|
}
|
|
|
|
error3 = NULL;
|
|
result3 = g_utf8_to_ucs4 (utf8, utf8_len, NULL, NULL, &error3);
|
|
|
|
if (error3 && error3->code == G_CONVERT_ERROR_PARTIAL_INPUT)
|
|
{
|
|
g_assert_no_error (error);
|
|
g_assert_cmpint (items_read, ==, error_pos);
|
|
g_assert_cmpint (items_written, ==, ucs4_len);
|
|
g_assert (result);
|
|
for (i = 0; i <= items_written; i++)
|
|
g_assert (result[i] == ucs4[i]);
|
|
g_error_free (error3);
|
|
}
|
|
else if (error_pos)
|
|
{
|
|
g_assert (error != NULL);
|
|
g_assert (result == NULL);
|
|
g_assert_cmpint (items_read, ==, error_pos);
|
|
g_error_free (error);
|
|
|
|
g_assert (error3 != NULL);
|
|
g_assert (result3 == NULL);
|
|
g_error_free (error3);
|
|
}
|
|
else
|
|
{
|
|
g_assert_no_error (error);
|
|
g_assert_cmpint (items_read, ==, utf8_len);
|
|
g_assert_cmpint (items_written, ==, ucs4_len);
|
|
g_assert (result);
|
|
for (i = 0; i <= items_written; i++)
|
|
g_assert (result[i] == ucs4[i]);
|
|
|
|
g_assert_no_error (error3);
|
|
g_assert (result3);
|
|
for (i = 0; i <= ucs4_len; i++)
|
|
g_assert (result3[i] == ucs4[i]);
|
|
}
|
|
|
|
g_free (result);
|
|
g_free (result3);
|
|
}
|
|
|
|
static void
|
|
check_ucs4_to_utf8 (const gunichar *ucs4,
|
|
glong ucs4_len,
|
|
const char *utf8,
|
|
glong utf8_len,
|
|
glong error_pos)
|
|
{
|
|
gchar *result, *result2, *result3;
|
|
glong items_read, items_read2;
|
|
glong items_written, items_written2;
|
|
GError *error, *error2, *error3;
|
|
|
|
error = NULL;
|
|
result = g_ucs4_to_utf8 (ucs4, ucs4_len, &items_read, &items_written, &error);
|
|
|
|
if (ucs4[ucs4_len] == 0)
|
|
{
|
|
/* check that len == -1 yields identical results */
|
|
error2 = NULL;
|
|
result2 = g_ucs4_to_utf8 (ucs4, -1, &items_read2, &items_written2, &error2);
|
|
|
|
g_assert (error || items_read2 == items_read);
|
|
g_assert (error || items_written2 == items_written);
|
|
g_assert_cmpint (!!result, ==, !!result2);
|
|
g_assert_cmpint (!!error, ==, !!error2);
|
|
if (result)
|
|
g_assert_cmpstr (result, ==, result2);
|
|
|
|
g_free (result2);
|
|
if (error2)
|
|
g_error_free (error2);
|
|
}
|
|
|
|
error3 = NULL;
|
|
result3 = g_ucs4_to_utf8 (ucs4, ucs4_len, NULL, NULL, &error3);
|
|
|
|
if (error_pos)
|
|
{
|
|
g_assert (error != NULL);
|
|
g_assert (result == NULL);
|
|
g_assert_cmpint (items_read, ==, error_pos);
|
|
g_error_free (error);
|
|
|
|
g_assert (error3 != NULL);
|
|
g_assert (result3 == NULL);
|
|
g_error_free (error3);
|
|
}
|
|
else
|
|
{
|
|
g_assert_no_error (error);
|
|
g_assert_cmpint (items_read, ==, ucs4_len);
|
|
g_assert_cmpint (items_written, ==, utf8_len);
|
|
g_assert (result);
|
|
g_assert_cmpstr (result, ==, utf8);
|
|
|
|
g_assert_no_error (error3);
|
|
g_assert (result3);
|
|
g_assert_cmpstr (result3, ==, utf8);
|
|
}
|
|
|
|
g_free (result);
|
|
g_free (result3);
|
|
}
|
|
|
|
static void
|
|
check_utf8_to_utf16 (const char *utf8,
|
|
glong utf8_len,
|
|
const gunichar2 *utf16,
|
|
glong utf16_len,
|
|
glong error_pos)
|
|
{
|
|
gunichar2 *result, *result2, *result3;
|
|
glong items_read, items_read2;
|
|
glong items_written, items_written2;
|
|
GError *error, *error2, *error3;
|
|
gint i;
|
|
|
|
error = NULL;
|
|
result = g_utf8_to_utf16 (utf8, utf8_len, &items_read, &items_written, &error);
|
|
|
|
if (utf8_len == strlen (utf8))
|
|
{
|
|
/* check that len == -1 yields identical results */
|
|
error2 = NULL;
|
|
result2 = g_utf8_to_utf16 (utf8, -1, &items_read2, &items_written2, &error2);
|
|
g_assert (error || items_read2 == items_read);
|
|
g_assert (error || items_written2 == items_written);
|
|
g_assert_cmpint (!!result, ==, !!result2);
|
|
g_assert_cmpint (!!error, ==, !!error2);
|
|
if (result)
|
|
for (i = 0; i <= items_written; i++)
|
|
g_assert (result[i] == result2[i]);
|
|
|
|
g_free (result2);
|
|
if (error2)
|
|
g_error_free (error2);
|
|
}
|
|
|
|
error3 = NULL;
|
|
result3 = g_utf8_to_utf16 (utf8, utf8_len, NULL, NULL, &error3);
|
|
|
|
if (error3 && error3->code == G_CONVERT_ERROR_PARTIAL_INPUT)
|
|
{
|
|
g_assert_no_error (error);
|
|
g_assert_cmpint (items_read, ==, error_pos);
|
|
g_assert_cmpint (items_written, ==, utf16_len);
|
|
g_assert (result);
|
|
for (i = 0; i <= items_written; i++)
|
|
g_assert (result[i] == utf16[i]);
|
|
g_error_free (error3);
|
|
}
|
|
else if (error_pos)
|
|
{
|
|
g_assert (error != NULL);
|
|
g_assert (result == NULL);
|
|
g_assert_cmpint (items_read, ==, error_pos);
|
|
g_error_free (error);
|
|
|
|
g_assert (error3 != NULL);
|
|
g_assert (result3 == NULL);
|
|
g_error_free (error3);
|
|
}
|
|
else
|
|
{
|
|
g_assert_no_error (error);
|
|
g_assert_cmpint (items_read, ==, utf8_len);
|
|
g_assert_cmpint (items_written, ==, utf16_len);
|
|
g_assert (result);
|
|
for (i = 0; i <= items_written; i++)
|
|
g_assert (result[i] == utf16[i]);
|
|
|
|
g_assert_no_error (error3);
|
|
g_assert (result3);
|
|
for (i = 0; i <= utf16_len; i++)
|
|
g_assert (result3[i] == utf16[i]);
|
|
}
|
|
|
|
g_free (result);
|
|
g_free (result3);
|
|
}
|
|
|
|
static void
|
|
check_utf16_to_utf8 (const gunichar2 *utf16,
|
|
glong utf16_len,
|
|
const char *utf8,
|
|
glong utf8_len,
|
|
glong error_pos)
|
|
{
|
|
gchar *result, *result2, *result3;
|
|
glong items_read, items_read2;
|
|
glong items_written, items_written2;
|
|
GError *error, *error2, *error3;
|
|
|
|
error = NULL;
|
|
result = g_utf16_to_utf8 (utf16, utf16_len, &items_read, &items_written, &error);
|
|
if (utf16[utf16_len] == 0)
|
|
{
|
|
/* check that len == -1 yields identical results */
|
|
error2 = NULL;
|
|
result2 = g_utf16_to_utf8 (utf16, -1, &items_read2, &items_written2, &error2);
|
|
|
|
g_assert (error || items_read2 == items_read);
|
|
g_assert (error || items_written2 == items_written);
|
|
g_assert_cmpint (!!result, ==, !!result2);
|
|
g_assert_cmpint (!!error, ==, !!error2);
|
|
if (result)
|
|
g_assert_cmpstr (result, ==, result2);
|
|
|
|
g_free (result2);
|
|
if (error2)
|
|
g_error_free (error2);
|
|
}
|
|
|
|
error3 = NULL;
|
|
result3 = g_utf16_to_utf8 (utf16, utf16_len, NULL, NULL, &error3);
|
|
|
|
if (error3 && error3->code == G_CONVERT_ERROR_PARTIAL_INPUT)
|
|
{
|
|
g_assert_no_error (error);
|
|
g_assert_cmpint (items_read, ==, error_pos);
|
|
g_assert_cmpint (items_read + 1, ==, utf16_len);
|
|
g_assert_cmpint (items_written, ==, utf8_len);
|
|
g_assert (result);
|
|
g_assert_cmpstr (result, ==, utf8);
|
|
g_error_free (error3);
|
|
}
|
|
else if (error_pos)
|
|
{
|
|
g_assert (error != NULL);
|
|
g_assert (result == NULL);
|
|
g_assert_cmpint (items_read, ==, error_pos);
|
|
g_error_free (error);
|
|
|
|
g_assert (error3 != NULL);
|
|
g_assert (result3 == NULL);
|
|
g_error_free (error3);
|
|
}
|
|
else
|
|
{
|
|
g_assert_no_error (error);
|
|
g_assert_cmpint (items_read, ==, utf16_len);
|
|
g_assert_cmpint (items_written, ==, utf8_len);
|
|
g_assert (result);
|
|
g_assert_cmpstr (result, ==, utf8);
|
|
|
|
g_assert_no_error (error3);
|
|
g_assert (result3);
|
|
g_assert_cmpstr (result3, ==, utf8);
|
|
}
|
|
|
|
g_free (result);
|
|
g_free (result3);
|
|
}
|
|
|
|
static void
|
|
check_ucs4_to_utf16 (const gunichar *ucs4,
|
|
glong ucs4_len,
|
|
const gunichar2 *utf16,
|
|
glong utf16_len,
|
|
glong error_pos)
|
|
{
|
|
gunichar2 *result, *result2, *result3;
|
|
glong items_read, items_read2;
|
|
glong items_written, items_written2;
|
|
GError *error, *error2, *error3;
|
|
gint i;
|
|
|
|
error = NULL;
|
|
result = g_ucs4_to_utf16 (ucs4, ucs4_len, &items_read, &items_written, &error);
|
|
|
|
if (ucs4[ucs4_len] == 0)
|
|
{
|
|
/* check that len == -1 yields identical results */
|
|
error2 = NULL;
|
|
result2 = g_ucs4_to_utf16 (ucs4, -1, &items_read2, &items_written2, &error2);
|
|
|
|
g_assert (error || items_read2 == items_read);
|
|
g_assert (error || items_written2 == items_written);
|
|
g_assert_cmpint (!!result, ==, !!result2);
|
|
g_assert_cmpint (!!error, ==, !!error2);
|
|
if (result)
|
|
for (i = 0; i <= utf16_len; i++)
|
|
g_assert (result[i] == result2[i]);
|
|
|
|
g_free (result2);
|
|
if (error2)
|
|
g_error_free (error2);
|
|
}
|
|
|
|
error3 = NULL;
|
|
result3 = g_ucs4_to_utf16 (ucs4, -1, NULL, NULL, &error3);
|
|
|
|
if (error_pos)
|
|
{
|
|
g_assert (error != NULL);
|
|
g_assert (result == NULL);
|
|
g_assert_cmpint (items_read, ==, error_pos);
|
|
g_error_free (error);
|
|
|
|
g_assert (error3 != NULL);
|
|
g_assert (result3 == NULL);
|
|
g_error_free (error3);
|
|
}
|
|
else
|
|
{
|
|
g_assert_no_error (error);
|
|
g_assert_cmpint (items_read, ==, ucs4_len);
|
|
g_assert_cmpint (items_written, ==, utf16_len);
|
|
g_assert (result);
|
|
for (i = 0; i <= utf16_len; i++)
|
|
g_assert (result[i] == utf16[i]);
|
|
|
|
g_assert_no_error (error3);
|
|
g_assert (result3);
|
|
for (i = 0; i <= utf16_len; i++)
|
|
g_assert (result3[i] == utf16[i]);
|
|
}
|
|
|
|
g_free (result);
|
|
g_free (result3);
|
|
}
|
|
|
|
static void
|
|
check_utf16_to_ucs4 (const gunichar2 *utf16,
|
|
glong utf16_len,
|
|
const gunichar *ucs4,
|
|
glong ucs4_len,
|
|
glong error_pos)
|
|
{
|
|
gunichar *result, *result2, *result3;
|
|
glong items_read, items_read2;
|
|
glong items_written, items_written2;
|
|
GError *error, *error2, *error3;
|
|
gint i;
|
|
|
|
error = NULL;
|
|
result = g_utf16_to_ucs4 (utf16, utf16_len, &items_read, &items_written, &error);
|
|
if (utf16[utf16_len] == 0)
|
|
{
|
|
/* check that len == -1 yields identical results */
|
|
error2 = NULL;
|
|
result2 = g_utf16_to_ucs4 (utf16, -1, &items_read2, &items_written2, &error2);
|
|
g_assert (error || items_read2 == items_read);
|
|
g_assert (error || items_written2 == items_written);
|
|
g_assert_cmpint (!!result, ==, !!result2);
|
|
g_assert_cmpint (!!error, ==, !!error2);
|
|
if (result)
|
|
for (i = 0; i <= items_written; i++)
|
|
g_assert (result[i] == result2[i]);
|
|
|
|
g_free (result2);
|
|
if (error2)
|
|
g_error_free (error2);
|
|
}
|
|
|
|
error3 = NULL;
|
|
result3 = g_utf16_to_ucs4 (utf16, utf16_len, NULL, NULL, &error3);
|
|
|
|
if (error3 && error3->code == G_CONVERT_ERROR_PARTIAL_INPUT)
|
|
{
|
|
g_assert_no_error (error);
|
|
g_assert_cmpint (items_read, ==, error_pos);
|
|
g_assert_cmpint (items_read + 1, ==, utf16_len);
|
|
g_assert_cmpint (items_written, ==, ucs4_len);
|
|
g_assert (result);
|
|
for (i = 0; i <= items_written; i++)
|
|
g_assert (result[i] == ucs4[i]);
|
|
g_error_free (error3);
|
|
}
|
|
else if (error_pos)
|
|
{
|
|
g_assert (error != NULL);
|
|
g_assert (result == NULL);
|
|
g_assert_cmpint (items_read, ==, error_pos);
|
|
g_error_free (error);
|
|
|
|
g_assert (error3 != NULL);
|
|
g_assert (result3 == NULL);
|
|
g_error_free (error3);
|
|
}
|
|
else
|
|
{
|
|
g_assert_no_error (error);
|
|
g_assert_cmpint (items_read, ==, utf16_len);
|
|
g_assert_cmpint (items_written, ==, ucs4_len);
|
|
g_assert (result);
|
|
for (i = 0; i <= ucs4_len; i++)
|
|
g_assert (result[i] == ucs4[i]);
|
|
|
|
g_assert_no_error (error3);
|
|
g_assert (result3);
|
|
for (i = 0; i <= ucs4_len; i++)
|
|
g_assert (result3[i] == ucs4[i]);
|
|
}
|
|
|
|
g_free (result);
|
|
g_free (result3);
|
|
}
|
|
|
|
static void
|
|
test_unicode_conversions (void)
|
|
{
|
|
const char *utf8;
|
|
gunichar ucs4[100];
|
|
gunichar2 utf16[100];
|
|
|
|
utf8 = "abc";
|
|
ucs4[0] = 0x61; ucs4[1] = 0x62; ucs4[2] = 0x63; ucs4[3] = 0;
|
|
utf16[0] = 0x61; utf16[1] = 0x62; utf16[2] = 0x63; utf16[3] = 0;
|
|
|
|
check_utf8_to_ucs4 (utf8, 3, ucs4, 3, 0);
|
|
check_ucs4_to_utf8 (ucs4, 3, utf8, 3, 0);
|
|
check_utf8_to_utf16 (utf8, 3, utf16, 3, 0);
|
|
check_utf16_to_utf8 (utf16, 3, utf8, 3, 0);
|
|
check_ucs4_to_utf16 (ucs4, 3, utf16, 3, 0);
|
|
check_utf16_to_ucs4 (utf16, 3, ucs4, 3, 0);
|
|
|
|
utf8 = "\316\261\316\262\316\263";
|
|
ucs4[0] = 0x03b1; ucs4[1] = 0x03b2; ucs4[2] = 0x03b3; ucs4[3] = 0;
|
|
utf16[0] = 0x03b1; utf16[1] = 0x03b2; utf16[2] = 0x03b3; utf16[3] = 0;
|
|
|
|
check_utf8_to_ucs4 (utf8, 6, ucs4, 3, 0);
|
|
check_ucs4_to_utf8 (ucs4, 3, utf8, 6, 0);
|
|
check_utf8_to_utf16 (utf8, 6, utf16, 3, 0);
|
|
check_utf16_to_utf8 (utf16, 3, utf8, 6, 0);
|
|
check_ucs4_to_utf16 (ucs4, 3, utf16, 3, 0);
|
|
check_utf16_to_ucs4 (utf16, 3, ucs4, 3, 0);
|
|
|
|
/* partial utf8 character */
|
|
utf8 = "abc\316";
|
|
ucs4[0] = 0x61; ucs4[1] = 0x62; ucs4[2] = 0x63; ucs4[3] = 0;
|
|
utf16[0] = 0x61; utf16[1] = 0x62; utf16[2] = 0x63; utf16[3] = 0;
|
|
|
|
check_utf8_to_ucs4 (utf8, 4, ucs4, 3, 3);
|
|
check_utf8_to_utf16 (utf8, 4, utf16, 3, 3);
|
|
|
|
/* invalid utf8 */
|
|
utf8 = "abc\316\316";
|
|
ucs4[0] = 0;
|
|
utf16[0] = 0;
|
|
|
|
check_utf8_to_ucs4 (utf8, 5, ucs4, 0, 3);
|
|
check_utf8_to_utf16 (utf8, 5, utf16, 0, 3);
|
|
|
|
/* partial utf16 character */
|
|
utf8 = "ab";
|
|
ucs4[0] = 0x61; ucs4[1] = 0x62; ucs4[2] = 0;
|
|
utf16[0] = 0x61; utf16[1] = 0x62; utf16[2] = 0xd801; utf16[3] = 0;
|
|
|
|
check_utf16_to_utf8 (utf16, 3, utf8, 2, 2);
|
|
check_utf16_to_ucs4 (utf16, 3, ucs4, 2, 2);
|
|
|
|
/* invalid utf16 */
|
|
utf8 = NULL;
|
|
ucs4[0] = 0;
|
|
utf16[0] = 0x61; utf16[1] = 0x62; utf16[2] = 0xdc01; utf16[3] = 0;
|
|
|
|
check_utf16_to_utf8 (utf16, 3, utf8, 0, 2);
|
|
check_utf16_to_ucs4 (utf16, 3, ucs4, 0, 2);
|
|
|
|
/* invalid ucs4 */
|
|
utf8 = NULL;
|
|
ucs4[0] = 0x61; ucs4[1] = 0x62; ucs4[2] = 0x80000000; ucs4[3] = 0;
|
|
utf16[0] = 0;
|
|
|
|
check_ucs4_to_utf8 (ucs4, 3, utf8, 0, 2);
|
|
check_ucs4_to_utf16 (ucs4, 3, utf16, 0, 2);
|
|
}
|
|
|
|
static void
|
|
test_filename_utf8 (void)
|
|
{
|
|
const gchar *filename = "/my/path/to/foo";
|
|
gchar *utf8;
|
|
gchar *back;
|
|
GError *error;
|
|
|
|
error = NULL;
|
|
utf8 = g_filename_to_utf8 (filename, -1, NULL, NULL, &error);
|
|
g_assert_no_error (error);
|
|
back = g_filename_from_utf8 (utf8, -1, NULL, NULL, &error);
|
|
g_assert_no_error (error);
|
|
g_assert_cmpstr (back, ==, filename);
|
|
|
|
g_free (utf8);
|
|
g_free (back);
|
|
}
|
|
|
|
static void
|
|
test_filename_display (void)
|
|
{
|
|
const gchar *filename = "/my/path/to/foo";
|
|
char *display;
|
|
|
|
display = g_filename_display_basename (filename);
|
|
g_assert_cmpstr (display, ==, "foo");
|
|
|
|
g_free (display);
|
|
}
|
|
|
|
/* g_convert() should accept and produce text buffers with embedded
|
|
* nul bytes/characters.
|
|
*/
|
|
static void
|
|
test_convert_embedded_nul (void)
|
|
{
|
|
gchar *res;
|
|
gsize bytes_read, bytes_written;
|
|
GError *error = NULL;
|
|
|
|
res = g_convert ("ab\0\xf6", 4, "UTF-8", "ISO-8859-1",
|
|
&bytes_read, &bytes_written, &error);
|
|
g_assert_no_error (error);
|
|
g_assert_cmpuint (bytes_read, ==, 4);
|
|
g_assert_cmpmem (res, bytes_written, "ab\0\xc3\xb6", 5);
|
|
g_free (res);
|
|
}
|
|
|
|
static void
|
|
test_locale_to_utf8_embedded_nul (void)
|
|
{
|
|
g_test_trap_subprocess ("/conversion/locale-to-utf8/embedded-nul/subprocess/utf8", 0, 0);
|
|
g_test_trap_assert_passed ();
|
|
g_test_trap_subprocess ("/conversion/locale-to-utf8/embedded-nul/subprocess/iconv", 0, 0);
|
|
g_test_trap_assert_passed ();
|
|
}
|
|
|
|
/* Test that embedded nul characters in UTF-8 input to g_locale_to_utf8()
|
|
* result in an error.
|
|
*/
|
|
static void
|
|
test_locale_to_utf8_embedded_nul_utf8 (void)
|
|
{
|
|
gchar *res;
|
|
gsize bytes_read;
|
|
GError *error = NULL;
|
|
|
|
setlocale (LC_ALL, "");
|
|
g_setenv ("CHARSET", "UTF-8", TRUE);
|
|
g_assert_true (g_get_charset (NULL));
|
|
|
|
res = g_locale_to_utf8 ("ab\0c", 4, &bytes_read, NULL, &error);
|
|
|
|
g_assert_null (res);
|
|
g_assert_error (error, G_CONVERT_ERROR, G_CONVERT_ERROR_ILLEGAL_SEQUENCE);
|
|
g_assert_cmpuint (bytes_read, ==, 2);
|
|
g_error_free (error);
|
|
}
|
|
|
|
/* Test that embedded nul characters in output of g_locale_to_utf8(),
|
|
* when converted from non-UTF8 input, result in an error.
|
|
*/
|
|
static void
|
|
test_locale_to_utf8_embedded_nul_iconv (void)
|
|
{
|
|
gchar *res;
|
|
GError *error = NULL;
|
|
|
|
setlocale (LC_ALL, "C");
|
|
g_setenv ("CHARSET", "US-ASCII", TRUE);
|
|
g_assert_false (g_get_charset (NULL));
|
|
|
|
res = g_locale_to_utf8 ("ab\0c", 4, NULL, NULL, &error);
|
|
|
|
g_assert_null (res);
|
|
g_assert_error (error, G_CONVERT_ERROR, G_CONVERT_ERROR_EMBEDDED_NUL);
|
|
g_error_free (error);
|
|
}
|
|
|
|
static void
|
|
test_locale_from_utf8_embedded_nul (void)
|
|
{
|
|
g_test_trap_subprocess ("/conversion/locale-from-utf8/embedded-nul/subprocess/utf8", 0, 0);
|
|
g_test_trap_assert_passed ();
|
|
g_test_trap_subprocess ("/conversion/locale-from-utf8/embedded-nul/subprocess/iconv", 0, 0);
|
|
g_test_trap_assert_passed ();
|
|
}
|
|
|
|
/* Test that embedded nul characters in input to g_locale_from_utf8(),
|
|
* when converting (copying) to UTF-8 output, result in an error.
|
|
*/
|
|
static void
|
|
test_locale_from_utf8_embedded_nul_utf8 (void)
|
|
{
|
|
gchar *res;
|
|
gsize bytes_read;
|
|
GError *error = NULL;
|
|
|
|
setlocale (LC_ALL, "");
|
|
g_setenv ("CHARSET", "UTF-8", TRUE);
|
|
g_assert_true (g_get_charset (NULL));
|
|
|
|
res = g_locale_from_utf8 ("ab\0c", 4, &bytes_read, NULL, &error);
|
|
|
|
g_assert_null (res);
|
|
g_assert_error (error, G_CONVERT_ERROR, G_CONVERT_ERROR_ILLEGAL_SEQUENCE);
|
|
g_assert_cmpuint (bytes_read, ==, 2);
|
|
g_error_free (error);
|
|
}
|
|
|
|
/* Test that embedded nul characters in input to g_locale_from_utf8(),
|
|
* when converting to non-UTF-8 output, result in an error.
|
|
*/
|
|
static void
|
|
test_locale_from_utf8_embedded_nul_iconv (void)
|
|
{
|
|
gchar *res;
|
|
gsize bytes_read;
|
|
GError *error = NULL;
|
|
|
|
setlocale (LC_ALL, "C");
|
|
g_setenv ("CHARSET", "US-ASCII", TRUE);
|
|
g_assert_false (g_get_charset (NULL));
|
|
|
|
res = g_locale_from_utf8 ("ab\0c", 4, &bytes_read, NULL, &error);
|
|
|
|
g_assert_null (res);
|
|
g_assert_error (error, G_CONVERT_ERROR, G_CONVERT_ERROR_ILLEGAL_SEQUENCE);
|
|
g_assert_cmpuint (bytes_read, ==, 2);
|
|
g_error_free (error);
|
|
}
|
|
|
|
static void
|
|
test_filename_to_utf8_embedded_nul (void)
|
|
{
|
|
g_test_trap_subprocess ("/conversion/filename-to-utf8/embedded-nul/subprocess/utf8", 0, 0);
|
|
g_test_trap_assert_passed ();
|
|
g_test_trap_subprocess ("/conversion/filename-to-utf8/embedded-nul/subprocess/iconv", 0, 0);
|
|
g_test_trap_assert_passed ();
|
|
}
|
|
|
|
/* Test that embedded nul characters in UTF-8 input to g_filename_to_utf8()
|
|
* result in an error.
|
|
*/
|
|
static void
|
|
test_filename_to_utf8_embedded_nul_utf8 (void)
|
|
{
|
|
gchar *res;
|
|
gsize bytes_read;
|
|
GError *error = NULL;
|
|
|
|
g_setenv ("G_FILENAME_ENCODING", "UTF-8", TRUE);
|
|
g_assert_true (g_get_filename_charsets (NULL));
|
|
|
|
res = g_filename_to_utf8 ("ab\0c", 4, &bytes_read, NULL, &error);
|
|
|
|
g_assert_null (res);
|
|
g_assert_error (error, G_CONVERT_ERROR, G_CONVERT_ERROR_ILLEGAL_SEQUENCE);
|
|
g_assert_cmpuint (bytes_read, ==, 2);
|
|
g_error_free (error);
|
|
}
|
|
|
|
/* Test that embedded nul characters in non-UTF-8 input of g_filename_to_utf8()
|
|
* result in an error.
|
|
*/
|
|
static void
|
|
test_filename_to_utf8_embedded_nul_iconv (void)
|
|
{
|
|
gchar *res;
|
|
gsize bytes_read;
|
|
GError *error = NULL;
|
|
|
|
g_setenv ("G_FILENAME_ENCODING", "US-ASCII", TRUE);
|
|
g_assert_false (g_get_filename_charsets (NULL));
|
|
|
|
res = g_filename_to_utf8 ("ab\0c", 4, &bytes_read, NULL, &error);
|
|
|
|
g_assert_null (res);
|
|
g_assert_error (error, G_CONVERT_ERROR, G_CONVERT_ERROR_ILLEGAL_SEQUENCE);
|
|
g_assert_cmpuint (bytes_read, ==, 2);
|
|
g_error_free (error);
|
|
}
|
|
|
|
static void
|
|
test_filename_from_utf8_embedded_nul (void)
|
|
{
|
|
g_test_trap_subprocess ("/conversion/filename-from-utf8/embedded-nul/subprocess/utf8", 0, 0);
|
|
g_test_trap_assert_passed ();
|
|
g_test_trap_subprocess ("/conversion/filename-from-utf8/embedded-nul/subprocess/iconv", 0, 0);
|
|
g_test_trap_assert_passed ();
|
|
}
|
|
|
|
/* Test that embedded nul characters in input to g_filename_from_utf8(),
|
|
* when converting (copying) to UTF-8 output, result in an error.
|
|
*/
|
|
static void
|
|
test_filename_from_utf8_embedded_nul_utf8 (void)
|
|
{
|
|
gchar *res;
|
|
gsize bytes_read;
|
|
GError *error = NULL;
|
|
|
|
g_setenv ("G_FILENAME_ENCODING", "UTF-8", TRUE);
|
|
g_assert_true (g_get_filename_charsets (NULL));
|
|
|
|
res = g_filename_from_utf8 ("ab\0c", 4, &bytes_read, NULL, &error);
|
|
|
|
g_assert_null (res);
|
|
g_assert_error (error, G_CONVERT_ERROR, G_CONVERT_ERROR_ILLEGAL_SEQUENCE);
|
|
g_assert_cmpuint (bytes_read, ==, 2);
|
|
g_error_free (error);
|
|
}
|
|
|
|
/* Test that embedded nul characters in input to g_filename_from_utf8(),
|
|
* when converting to non-UTF-8 output, result in an error.
|
|
*/
|
|
static void
|
|
test_filename_from_utf8_embedded_nul_iconv (void)
|
|
{
|
|
gchar *res;
|
|
gsize bytes_read;
|
|
GError *error = NULL;
|
|
|
|
g_setenv ("G_FILENAME_ENCODING", "US-ASCII", TRUE);
|
|
g_assert_false (g_get_filename_charsets (NULL));
|
|
|
|
res = g_filename_from_utf8 ("ab\0c", 4, &bytes_read, NULL, &error);
|
|
|
|
g_assert_null (res);
|
|
g_assert_error (error, G_CONVERT_ERROR, G_CONVERT_ERROR_ILLEGAL_SEQUENCE);
|
|
g_assert_cmpuint (bytes_read, ==, 2);
|
|
g_error_free (error);
|
|
}
|
|
|
|
static void
|
|
test_no_conv (void)
|
|
{
|
|
const gchar *in = "";
|
|
gchar *out G_GNUC_UNUSED;
|
|
gsize bytes_read = 0;
|
|
gsize bytes_written = 0;
|
|
GError *error = NULL;
|
|
|
|
out = g_convert (in, -1, "XXX", "UVZ",
|
|
&bytes_read, &bytes_written, &error);
|
|
|
|
/* error code is unreliable, since we mishandle errno there */
|
|
g_assert (error && error->domain == G_CONVERT_ERROR);
|
|
g_error_free (error);
|
|
}
|
|
|
|
int
|
|
main (int argc, char *argv[])
|
|
{
|
|
g_test_init (&argc, &argv, NULL);
|
|
|
|
g_test_add_func ("/conversion/no-conv", test_no_conv);
|
|
g_test_add_func ("/conversion/iconv-state", test_iconv_state);
|
|
g_test_add_func ("/conversion/illegal-sequence", test_one_half);
|
|
g_test_add_func ("/conversion/byte-order", test_byte_order);
|
|
g_test_add_func ("/conversion/unicode", test_unicode_conversions);
|
|
g_test_add_func ("/conversion/filename-utf8", test_filename_utf8);
|
|
g_test_add_func ("/conversion/filename-display", test_filename_display);
|
|
g_test_add_func ("/conversion/convert-embedded-nul", test_convert_embedded_nul);
|
|
g_test_add_func ("/conversion/locale-to-utf8/embedded-nul", test_locale_to_utf8_embedded_nul);
|
|
g_test_add_func ("/conversion/locale-to-utf8/embedded-nul/subprocess/utf8", test_locale_to_utf8_embedded_nul_utf8);
|
|
g_test_add_func ("/conversion/locale-to-utf8/embedded-nul/subprocess/iconv", test_locale_to_utf8_embedded_nul_iconv);
|
|
g_test_add_func ("/conversion/locale-from-utf8/embedded-nul", test_locale_from_utf8_embedded_nul);
|
|
g_test_add_func ("/conversion/locale-from-utf8/embedded-nul/subprocess/utf8", test_locale_from_utf8_embedded_nul_utf8);
|
|
g_test_add_func ("/conversion/locale-from-utf8/embedded-nul/subprocess/iconv", test_locale_from_utf8_embedded_nul_iconv);
|
|
g_test_add_func ("/conversion/filename-to-utf8/embedded-nul", test_filename_to_utf8_embedded_nul);
|
|
g_test_add_func ("/conversion/filename-to-utf8/embedded-nul/subprocess/utf8", test_filename_to_utf8_embedded_nul_utf8);
|
|
g_test_add_func ("/conversion/filename-to-utf8/embedded-nul/subprocess/iconv", test_filename_to_utf8_embedded_nul_iconv);
|
|
g_test_add_func ("/conversion/filename-from-utf8/embedded-nul", test_filename_from_utf8_embedded_nul);
|
|
g_test_add_func ("/conversion/filename-from-utf8/embedded-nul/subprocess/utf8", test_filename_from_utf8_embedded_nul_utf8);
|
|
g_test_add_func ("/conversion/filename-from-utf8/embedded-nul/subprocess/iconv", test_filename_from_utf8_embedded_nul_iconv);
|
|
|
|
return g_test_run ();
|
|
}
|