Merge branch 'wip/pwithnall/backport-3373-file-load-4gb-glib-2-80' into 'glib-2-80'

Backport !3373 and !4117 “Handle files >4GB in g_file_load_contents()” to glib-2-80

See merge request GNOME/glib!4118
This commit is contained in:
Michael Catanzaro 2024-06-18 22:09:21 +00:00
commit 5d70340412
3 changed files with 210 additions and 27 deletions

View File

@ -7933,7 +7933,8 @@ g_file_load_contents (GFile *file,
GError **error) GError **error)
{ {
GFileInputStream *in; GFileInputStream *in;
GByteArray *content; char *data;
gsize size;
gsize pos; gsize pos;
gssize res; gssize res;
GFileInfo *info; GFileInfo *info;
@ -7945,17 +7946,22 @@ g_file_load_contents (GFile *file,
if (in == NULL) if (in == NULL)
return FALSE; return FALSE;
content = g_byte_array_new (); size = GET_CONTENT_BLOCK_SIZE;
data = g_malloc (GET_CONTENT_BLOCK_SIZE);
pos = 0; pos = 0;
g_byte_array_set_size (content, pos + GET_CONTENT_BLOCK_SIZE + 1);
while ((res = g_input_stream_read (G_INPUT_STREAM (in), while ((res = g_input_stream_read (G_INPUT_STREAM (in),
content->data + pos, data + pos,
GET_CONTENT_BLOCK_SIZE, GET_CONTENT_BLOCK_SIZE,
cancellable, error)) > 0) cancellable, error)) > 0)
{ {
pos += res; pos += res;
g_byte_array_set_size (content, pos + GET_CONTENT_BLOCK_SIZE + 1); if (size - pos < GET_CONTENT_BLOCK_SIZE)
{
g_assert (size <= G_MAXSIZE / 2);
size *= 2;
data = g_realloc (data, size);
}
} }
if (etag_out) if (etag_out)
@ -7980,17 +7986,19 @@ g_file_load_contents (GFile *file,
if (res < 0) if (res < 0)
{ {
/* error is set already */ /* error is set already */
g_byte_array_free (content, TRUE); g_free (data);
return FALSE; return FALSE;
} }
if (length) if (length)
*length = pos; *length = pos;
/* Zero terminate (we got an extra byte allocated for this */ /* Zero terminate (allocating extra bytes if needed) */
content->data[pos] = 0; if (pos >= size)
data = g_realloc (data, pos + 1);
data[pos] = 0;
*contents = (char *)g_byte_array_free (content, FALSE); *contents = g_steal_pointer (&data);
return TRUE; return TRUE;
} }
@ -7998,7 +8006,8 @@ g_file_load_contents (GFile *file,
typedef struct { typedef struct {
GTask *task; GTask *task;
GFileReadMoreCallback read_more_callback; GFileReadMoreCallback read_more_callback;
GByteArray *content; char *data;
gsize size;
gsize pos; gsize pos;
char *etag; char *etag;
} LoadContentsData; } LoadContentsData;
@ -8007,12 +8016,31 @@ typedef struct {
static void static void
load_contents_data_free (LoadContentsData *data) load_contents_data_free (LoadContentsData *data)
{ {
if (data->content) g_clear_pointer (&data->data, g_free);
g_byte_array_free (data->content, TRUE);
g_free (data->etag); g_free (data->etag);
g_free (data); g_free (data);
} }
/*
 * load_contents_data_ensure_space:
 * @data: load state whose buffer (data->data, data->size, data->pos) is grown
 * @space: number of bytes that must be available after data->pos
 *
 * Makes sure at least @space bytes are free in the buffer past the current
 * position. Nothing happens if the buffer already has enough room. The first
 * allocation is exactly @space bytes; after that the buffer size is doubled
 * until the request fits, then reallocated once.
 *
 * Aborts via g_assert() if doubling would overflow a gsize.
 */
static void
load_contents_data_ensure_space (LoadContentsData *data,
                                 gsize             space)
{
  /* Already enough room after the current position. */
  if (data->size - data->pos >= space)
    return;

  if (data->data == NULL)
    {
      /* No buffer yet: allocate exactly what was asked for. */
      data->size = space;
      data->data = g_malloc (space);
      return;
    }

  /* Keep doubling until the request fits; a single doubling is not enough
   * when the existing buffer is much smaller than @space. */
  do
    {
      g_assert (data->size <= G_MAXSIZE / 2);
      data->size *= 2;
    }
  while (data->size - data->pos < space);

  data->data = g_realloc (data->data, data->size);
}
static void static void
load_contents_close_callback (GObject *obj, load_contents_close_callback (GObject *obj,
GAsyncResult *close_res, GAsyncResult *close_res,
@ -8085,12 +8113,10 @@ load_contents_read_callback (GObject *obj,
{ {
data->pos += read_size; data->pos += read_size;
g_byte_array_set_size (data->content, load_contents_data_ensure_space (data, GET_CONTENT_BLOCK_SIZE);
data->pos + GET_CONTENT_BLOCK_SIZE);
if (data->read_more_callback && if (data->read_more_callback &&
!data->read_more_callback ((char *)data->content->data, data->pos, !data->read_more_callback (data->data, data->pos,
g_async_result_get_user_data (G_ASYNC_RESULT (data->task)))) g_async_result_get_user_data (G_ASYNC_RESULT (data->task))))
g_file_input_stream_query_info_async (G_FILE_INPUT_STREAM (stream), g_file_input_stream_query_info_async (G_FILE_INPUT_STREAM (stream),
G_FILE_ATTRIBUTE_ETAG_VALUE, G_FILE_ATTRIBUTE_ETAG_VALUE,
@ -8100,7 +8126,7 @@ load_contents_read_callback (GObject *obj,
data); data);
else else
g_input_stream_read_async (stream, g_input_stream_read_async (stream,
data->content->data + data->pos, data->data + data->pos,
GET_CONTENT_BLOCK_SIZE, GET_CONTENT_BLOCK_SIZE,
0, 0,
g_task_get_cancellable (data->task), g_task_get_cancellable (data->task),
@ -8123,10 +8149,9 @@ load_contents_open_callback (GObject *obj,
if (stream) if (stream)
{ {
g_byte_array_set_size (data->content, load_contents_data_ensure_space (data, GET_CONTENT_BLOCK_SIZE);
data->pos + GET_CONTENT_BLOCK_SIZE);
g_input_stream_read_async (G_INPUT_STREAM (stream), g_input_stream_read_async (G_INPUT_STREAM (stream),
data->content->data + data->pos, data->data + data->pos,
GET_CONTENT_BLOCK_SIZE, GET_CONTENT_BLOCK_SIZE,
0, 0,
g_task_get_cancellable (data->task), g_task_get_cancellable (data->task),
@ -8176,7 +8201,6 @@ g_file_load_partial_contents_async (GFile *file,
data = g_new0 (LoadContentsData, 1); data = g_new0 (LoadContentsData, 1);
data->read_more_callback = read_more_callback; data->read_more_callback = read_more_callback;
data->content = g_byte_array_new ();
data->task = g_task_new (file, cancellable, callback, user_data); data->task = g_task_new (file, cancellable, callback, user_data);
g_task_set_source_tag (data->task, g_file_load_partial_contents_async); g_task_set_source_tag (data->task, g_file_load_partial_contents_async);
@ -8245,11 +8269,10 @@ g_file_load_partial_contents_finish (GFile *file,
} }
/* Zero terminate */ /* Zero terminate */
g_byte_array_set_size (data->content, data->pos + 1); load_contents_data_ensure_space (data, 1);
data->content->data[data->pos] = 0; data->data[data->pos] = 0;
*contents = (char *)g_byte_array_free (data->content, FALSE); *contents = g_steal_pointer (&data->data);
data->content = NULL;
return TRUE; return TRUE;
} }

View File

@ -6,6 +6,7 @@
#include <stdlib.h> #include <stdlib.h>
#include <gio/gio.h> #include <gio/gio.h>
#include <gio/gfiledescriptorbased.h> #include <gio/gfiledescriptorbased.h>
#include <glib/gstdio.h>
#ifdef G_OS_UNIX #ifdef G_OS_UNIX
#include <sys/stat.h> #include <sys/stat.h>
#endif #endif
@ -2742,7 +2743,8 @@ test_load_bytes (void)
len = strlen ("test_load_bytes"); len = strlen ("test_load_bytes");
ret = write (fd, "test_load_bytes", len); ret = write (fd, "test_load_bytes", len);
g_assert_cmpint (ret, ==, len); g_assert_cmpint (ret, ==, len);
close (fd); g_clear_fd (&fd, &error);
g_assert_no_error (error);
file = g_file_new_for_path (filename); file = g_file_new_for_path (filename);
bytes = g_file_load_bytes (file, NULL, NULL, &error); bytes = g_file_load_bytes (file, NULL, NULL, &error);
@ -2785,6 +2787,7 @@ test_load_bytes_async (void)
{ {
LoadBytesAsyncData data = { 0 }; LoadBytesAsyncData data = { 0 };
gchar filename[] = "g_file_load_bytes_XXXXXX"; gchar filename[] = "g_file_load_bytes_XXXXXX";
GError *error = NULL;
int len; int len;
int fd; int fd;
int ret; int ret;
@ -2794,7 +2797,8 @@ test_load_bytes_async (void)
len = strlen ("test_load_bytes_async"); len = strlen ("test_load_bytes_async");
ret = write (fd, "test_load_bytes_async", len); ret = write (fd, "test_load_bytes_async", len);
g_assert_cmpint (ret, ==, len); g_assert_cmpint (ret, ==, len);
close (fd); g_clear_fd (&fd, &error);
g_assert_no_error (error);
data.main_loop = g_main_loop_new (NULL, FALSE); data.main_loop = g_main_loop_new (NULL, FALSE);
data.file = g_file_new_for_path (filename); data.file = g_file_new_for_path (filename);
@ -2811,6 +2815,158 @@ test_load_bytes_async (void)
g_main_loop_unref (data.main_loop); g_main_loop_unref (data.main_loop);
} }
/* Size in bytes of the test file used by the >4GB load tests. */
#if GLIB_SIZEOF_SIZE_T <= 4
/* gsize cannot hold a value above 4GB here, so use the largest one it can. */
static const gsize testfile_4gb_size = G_MAXSIZE;
#else
/* 2^32 + 2^16 bytes, i.e. just past the 4GB boundary. */
static const gsize testfile_4gb_size = ((gsize) 1 << 32) + (1 << 16);
#endif
/*
 * create_testfile_4gb_or_skip:
 * @filename: template passed to g_mkstemp(); it is modified in place
 *
 * Creates a temporary file and resizes it to testfile_4gb_size bytes with
 * ftruncate().
 *
 * Returns: TRUE if the file was created and resized. FALSE if the calling
 *   test has been marked as skipped, either because slow tests are disabled
 *   or because the file could not be resized (in which case it is unlinked).
 */
static gboolean
create_testfile_4gb_or_skip (char *filename)
{
  GError *error = NULL;
  int fd;
  int ret;

  /* Reading each 4GB test file takes about 5s on a fast machine, and another 7s
   * to compare its contents once it's been read. That's too slow for a normal
   * test run, and there's no way to speed it up. */
  if (!g_test_slow ())
    {
      g_test_skip ("Skipping slow >4GB file test");
      return FALSE;
    }

  fd = g_mkstemp (filename);
  g_assert_cmpint (fd, !=, -1);

  ret = ftruncate (fd, testfile_4gb_size);

  /* Close the descriptor whether or not the resize worked. */
  g_clear_fd (&fd, &error);
  g_assert_no_error (error);

  /* ftruncate() returns 0 on success and -1 on failure, so any non-zero
   * result means the large file could not be created. */
  if (ret != 0)
    {
      g_test_skip ("Could not create testfile >4GB");
      g_assert_no_errno (g_unlink (filename));
      return FALSE;
    }

  return TRUE;
}
/*
 * check_testfile_4gb_contents:
 * @data: buffer loaded from the test file; must not be NULL
 * @len: number of bytes loaded
 *
 * Asserts that @len equals testfile_4gb_size and that every one of those
 * bytes in @data is zero.
 */
static void
check_testfile_4gb_contents (const char *data,
                             gsize       len)
{
  gsize i;

  g_assert_nonnull (data);
  g_assert_cmpuint (testfile_4gb_size, ==, len);

  /* Stop at the first non-zero byte so a failure reports its offset. */
  for (i = 0; i < testfile_4gb_size; i++)
    {
      if (data[i] != 0)
        break;
    }

  /* Both operands are gsize, so compare them as unsigned values. */
  g_assert_cmpuint (i, ==, testfile_4gb_size);
}
/* Loads a >4GB test file synchronously with g_file_load_contents() and
 * checks the length and contents of what was returned. */
static void
test_load_contents_4gb (void)
{
  char filename[] = "g_file_load_contents_4gb_XXXXXX";
  GError *local_error = NULL;
  GFile *file;
  char *contents;
  gsize length;
  gboolean ok;

  /* The helper marks the test as skipped when it returns FALSE. */
  if (!create_testfile_4gb_or_skip (filename))
    return;

  file = g_file_new_for_path (filename);

  ok = g_file_load_contents (file, NULL, &contents, &length, NULL, &local_error);
  g_assert_no_error (local_error);
  g_assert_true (ok);

  check_testfile_4gb_contents (contents, length);

  /* Release the loaded buffer, then remove the temporary file. */
  g_free (contents);
  g_file_delete (file, NULL, NULL);
  g_object_unref (file);
}
/* Async-ready callback: stores a new reference to @result in the
 * GAsyncResult pointer that @user_data points at, then wakes up the main
 * context (NULL) so the waiting loop sees it. */
static void
load_contents_4gb_cb (GObject      *object,
                      GAsyncResult *result,
                      gpointer      user_data)
{
  GAsyncResult **stash = (GAsyncResult **) user_data;

  /* The slot must still be empty when the callback runs. */
  g_assert (*stash == NULL);
  *stash = g_object_ref (result);

  g_main_context_wakeup (NULL);
}
/* Loads a >4GB test file with g_file_load_contents_async() and checks the
 * length and contents returned by g_file_load_contents_finish(). */
static void
test_load_contents_4gb_async (void)
{
  char filename[] = "g_file_load_contents_4gb_async_XXXXXX";
  GAsyncResult *pending = NULL;
  GError *local_error = NULL;
  GFile *file;
  char *contents;
  gsize length;
  gboolean ok;

  /* The helper marks the test as skipped when it returns FALSE. */
  if (!create_testfile_4gb_or_skip (filename))
    return;

  file = g_file_new_for_path (filename);
  g_file_load_contents_async (file, NULL, load_contents_4gb_cb, &pending);

  /* Iterate the main context (blocking) until the callback has stored
   * the async result. */
  while (pending == NULL)
    g_main_context_iteration (NULL, TRUE);

  ok = g_file_load_contents_finish (file, pending, &contents, &length, NULL, &local_error);
  g_assert_no_error (local_error);
  g_assert_true (ok);

  check_testfile_4gb_contents (contents, length);

  /* Release the loaded buffer, remove the temporary file, drop references. */
  g_free (contents);
  g_file_delete (file, NULL, NULL);
  g_object_unref (pending);
  g_object_unref (file);
}
static void
test_load_bytes_4gb (void)
{
char filename[] = "g_file_load_bytes_4gb_XXXXXX";
GError *error = NULL;
GBytes *bytes;
GFile *file;
if (!create_testfile_4gb_or_skip (filename))
return;
file = g_file_new_for_path (filename);
bytes = g_file_load_bytes (file, NULL, NULL, &error);
g_assert_no_error (error);
g_assert_true (bytes);
check_testfile_4gb_contents (g_bytes_get_data (bytes, NULL), g_bytes_get_size (bytes));
g_file_delete (file, NULL, NULL);
g_bytes_unref (bytes);
g_object_unref (file);
}
static void static void
test_writev_helper (GOutputVector *vectors, test_writev_helper (GOutputVector *vectors,
gsize n_vectors, gsize n_vectors,
@ -4032,6 +4188,9 @@ main (int argc, char *argv[])
g_test_add_func ("/file/measure-async", test_measure_async); g_test_add_func ("/file/measure-async", test_measure_async);
g_test_add_func ("/file/load-bytes", test_load_bytes); g_test_add_func ("/file/load-bytes", test_load_bytes);
g_test_add_func ("/file/load-bytes-async", test_load_bytes_async); g_test_add_func ("/file/load-bytes-async", test_load_bytes_async);
g_test_add_func ("/file/load-bytes-4gb", test_load_bytes_4gb);
g_test_add_func ("/file/load-contents-4gb", test_load_contents_4gb);
g_test_add_func ("/file/load-contents-4gb-async", test_load_contents_4gb_async);
g_test_add_func ("/file/writev", test_writev); g_test_add_func ("/file/writev", test_writev);
g_test_add_func ("/file/writev/no-bytes-written", test_writev_no_bytes_written); g_test_add_func ("/file/writev/no-bytes-written", test_writev_no_bytes_written);
g_test_add_func ("/file/writev/no-vectors", test_writev_no_vectors); g_test_add_func ("/file/writev/no-vectors", test_writev_no_vectors);

View File

@ -1068,6 +1068,7 @@ g_array_maybe_expand (GRealArray *array,
if (want_len > array->elt_capacity) if (want_len > array->elt_capacity)
{ {
gsize want_alloc = g_nearest_pow (g_array_elt_len (array, want_len)); gsize want_alloc = g_nearest_pow (g_array_elt_len (array, want_len));
g_assert (want_alloc >= g_array_elt_len (array, want_len));
want_alloc = MAX (want_alloc, MIN_ARRAY_SIZE); want_alloc = MAX (want_alloc, MIN_ARRAY_SIZE);
array->data = g_realloc (array->data, want_alloc); array->data = g_realloc (array->data, want_alloc);