/*
 * Copyright © 2010 Codethink Limited
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the licence, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the
 * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
 * Boston, MA 02111-1307, USA.
 *
 * Author: Ryan Lortie
 */

#include "gvdb-reader.h"
#include "gvdb-format.h"

#include <string.h>

/*
 * In-memory handle on one hash table stored inside a mapped gvdb file.
 *
 * @data/@size describe the whole mapped file; every offset read from the
 * file is validated against @size before it is turned into a pointer.
 * The bloom_words, hash_buckets and hash_items members point directly
 * into the mapping and therefore hold little-endian values.
 */
struct _GvdbTable {
  gint ref_count;

  const gchar *data;
  gsize size;

  GMappedFile *mapped;
  gboolean byteswapped;   /* recorded from the header signature; not consulted elsewhere in this file */
  gboolean trusted;       /* forwarded to g_variant_new_from_data() */

  const guint32_le *bloom_words;
  guint32 n_bloom_words;
  guint bloom_shift;

  const guint32_le *hash_buckets;
  guint32 n_buckets;

  struct gvdb_hash_item *hash_items;
  guint32 n_hash_items;
};

/*
 * Returns a pointer to the key fragment stored for @item and writes its
 * length to @size.  The fragment is NOT nul-terminated.
 *
 * Returns NULL if the fragment would extend past the end of the file (or
 * if the 32-bit end offset wraps around); @size is written in either case.
 */
static const gchar *
gvdb_table_item_get_key (GvdbTable                   *file,
                         const struct gvdb_hash_item *item,
                         gsize                       *size)
{
  guint32 start, end;

  start = guint32_from_le (item->key_start);
  *size = guint16_from_le (item->key_size);
  end = start + *size;

  /* start > end catches 32-bit wrap-around of start + size */
  if G_UNLIKELY (start > end || end > file->size)
    return NULL;

  return file->data + start;
}

/*
 * Resolves @pointer (a start/end offset pair) to an address inside the
 * mapped file and writes the length of the region to @size.
 *
 * @alignment is used as a bit mask (alignment - 1), so it is expected to
 * be a power of two.  Returns NULL, leaving @size untouched, if the range
 * is inverted, extends past the end of the file, or the start offset is
 * not a multiple of @alignment.
 */
static gconstpointer
gvdb_table_dereference (GvdbTable                 *file,
                        const struct gvdb_pointer *pointer,
                        gint                       alignment,
                        gsize                     *size)
{
  guint32 start, end;

  start = guint32_from_le (pointer->start);
  end = guint32_from_le (pointer->end);

  if G_UNLIKELY (start > end || end > file->size || start & (alignment - 1))
    return NULL;

  *size = end - start;

  return file->data + start;
}

/*
 * Points @file at the hash table referenced by @pointer.
 *
 * The referenced region is laid out as: hash header, bloom filter words,
 * bucket array, hash items.  Each section is bounds-checked in turn; on
 * the first failed check the function returns early.  Because the table
 * is zero-initialised by its callers, an early return leaves n_buckets
 * and/or n_hash_items at zero, which gvdb_table_lookup() treats as an
 * empty table.
 */
static void
gvdb_table_setup_root (GvdbTable                 *file,
                       const struct gvdb_pointer *pointer)
{
  const struct gvdb_hash_header *header;
  guint32 n_bloom_words;
  guint32 bloom_shift;
  guint32 n_buckets;
  gsize size;

  header = gvdb_table_dereference (file, pointer, 4, &size);

  if G_UNLIKELY (header == NULL || size < sizeof *header)
    return;

  size -= sizeof *header;

  n_bloom_words = guint32_from_le (header->n_bloom_words);
  n_buckets = guint32_from_le (header->n_buckets);

  /* The top 5 bits of the stored word carry the bloom shift, the low
   * 27 bits carry the number of bloom filter words.
   */
  bloom_shift = n_bloom_words >> 27;
  n_bloom_words &= (1u << 27) - 1;

  if G_UNLIKELY (n_bloom_words * sizeof (guint32_le) > size)
    return;

  file->bloom_words = (gpointer) (header + 1);
  size -= n_bloom_words * sizeof (guint32_le);
  file->n_bloom_words = n_bloom_words;
  /* Store the decoded shift so gvdb_table_bloom_filter() can use it. */
  file->bloom_shift = bloom_shift;

  if G_UNLIKELY (n_buckets > G_MAXUINT / sizeof (guint32_le) ||
                 n_buckets * sizeof (guint32_le) > size)
    return;

  file->hash_buckets = file->bloom_words + file->n_bloom_words;
  size -= n_buckets * sizeof (guint32_le);
  file->n_buckets = n_buckets;

  /* Whatever remains must be a whole number of hash items. */
  if G_UNLIKELY (size % sizeof (struct gvdb_hash_item))
    return;

  file->hash_items = (gpointer) (file->hash_buckets + n_buckets);
  file->n_hash_items = size / sizeof (struct gvdb_hash_item);
}

/**
 * gvdb_table_new:
 * @filename: the path to the hash file
 * @trusted: if the contents of @filename are trusted
 * @error: %NULL, or a pointer to a %NULL #GError
 * @returns: a new #GvdbTable, or %NULL on failure
 *
 * Creates a new #GvdbTable from the contents of the file found at
 * @filename.
 *
 * This function fails in two cases:
 *
 *  - the file can not be opened, in which case @error is the error
 *    reported by g_mapped_file_new();
 *
 *  - the file is at least as large as a gvdb header but its signature
 *    or version is not recognised, in which case @error is set to
 *    %G_FILE_ERROR_INVAL.
 *
 * A file that is too small to contain a header, or whose root hash
 * table fails validation, is considered to be a valid #GvdbTable with
 * no entries.
 *
 * You should call gvdb_table_unref() on the return result when you no
 * longer require it.
 **/
GvdbTable *
gvdb_table_new (const gchar  *filename,
                gboolean      trusted,
                GError      **error)
{
  GMappedFile *mapped;
  GvdbTable *file;

  if ((mapped = g_mapped_file_new (filename, FALSE, error)) == NULL)
    return NULL;

  file = g_slice_new0 (GvdbTable);
  file->data = g_mapped_file_get_contents (mapped);
  file->size = g_mapped_file_get_length (mapped);
  file->trusted = trusted;
  file->mapped = mapped;
  file->ref_count = 1;

  if (sizeof (struct gvdb_header) <= file->size)
    {
      const struct gvdb_header *header = (gpointer) file->data;

      if (header->signature[0] == GVDB_SIGNATURE0 &&
          header->signature[1] == GVDB_SIGNATURE1 &&
          guint32_from_le (header->version) == 0)
        file->byteswapped = FALSE;

      else if (header->signature[0] == GVDB_SWAPPED_SIGNATURE0 &&
               header->signature[1] == GVDB_SWAPPED_SIGNATURE1 &&
               guint32_from_le (header->version) == 0)
        file->byteswapped = TRUE;

      else
        {
          g_set_error (error, G_FILE_ERROR, G_FILE_ERROR_INVAL,
                       "%s: invalid header", filename);
          g_slice_free (GvdbTable, file);
          g_mapped_file_unref (mapped);

          return NULL;
        }

      gvdb_table_setup_root (file, &header->root);
    }

  return file;
}

/*
 * Tests @hash_value against the table's bloom filter.
 *
 * Returns TRUE if the table has no bloom filter, or if both bits derived
 * from @hash_value are set in the selected filter word; FALSE otherwise.
 */
static gboolean
gvdb_table_bloom_filter (GvdbTable *file,
                         guint32    hash_value)
{
  guint32 word, mask;

  if (file->n_bloom_words == 0)
    return TRUE;

  word = (hash_value / 32) % file->n_bloom_words;

  /* Unsigned literals: shifting a signed 1 left by 31 is undefined. */
  mask = 1u << (hash_value & 31);
  mask |= 1u << ((hash_value >> file->bloom_shift) & 31);

  /* Filter words live in the mapped file and are little-endian. */
  return (guint32_from_le (file->bloom_words[word]) & mask) == mask;
}

/*
 * Checks that the chain of key fragments starting at @item and following
 * the parent links spells out exactly the first @key_length bytes of @key.
 *
 * Each item stores only the trailing fragment of its full name; the
 * fragment is compared against the tail of @key and the remaining prefix
 * is checked recursively against the parent item.  A parent value of
 * (guint32) -1 marks an item with no parent.
 */
static gboolean
gvdb_table_check_name (GvdbTable             *file,
                       struct gvdb_hash_item *item,
                       const gchar           *key,
                       guint                  key_length)
{
  const gchar *this_key;
  gsize this_size;
  guint32 parent;

  this_key = gvdb_table_item_get_key (file, item, &this_size);

  if G_UNLIKELY (this_key == NULL || this_size > key_length)
    return FALSE;

  key_length -= this_size;

  if G_UNLIKELY (memcmp (this_key, key + key_length, this_size) != 0)
    return FALSE;

  parent = guint32_from_le (item->parent);

  if (key_length == 0 && parent == (guint32) -1)
    return TRUE;

  /* Requiring a non-empty fragment guarantees key_length shrinks on
   * every step, so a cycle of parent links cannot recurse forever.
   */
  if G_LIKELY (parent < file->n_hash_items && this_size > 0)
    return gvdb_table_check_name (file,
                                  &file->hash_items[parent],
                                  key, key_length);

  return FALSE;
}

/*
 * Finds the hash item named @key whose type byte equals @type.
 *
 * Returns a pointer into the mapped file, or NULL if the table is empty,
 * the bloom filter rejects the key, or no item in the key's bucket
 * matches on hash value, full name and type.
 */
const struct gvdb_hash_item *
gvdb_table_lookup (GvdbTable   *file,
                   const gchar *key,
                   gchar        type)
{
  guint32 hash_value = 5381;
  guint key_length;
  guint32 bucket;
  guint32 lastno;
  guint32 itemno;

  if G_UNLIKELY (file->n_buckets == 0 || file->n_hash_items == 0)
    return NULL;

  /* Read key bytes as signed char so the hash does not depend on the
   * platform's choice of signedness for plain char.
   */
  for (key_length = 0; key[key_length]; key_length++)
    hash_value = (hash_value * 33) + ((const signed char *) key)[key_length];

  if (!gvdb_table_bloom_filter (file, hash_value))
    return NULL;

  bucket = hash_value % file->n_buckets;
  itemno = guint32_from_le (file->hash_buckets[bucket]);

  /* A bucket's items run up to the first item of the next bucket; the
   * last bucket runs to the end of the item array.  An out-of-range
   * end index is clamped to the item count.
   */
  if (bucket == file->n_buckets - 1)
    lastno = file->n_hash_items;
  else
    {
      lastno = guint32_from_le (file->hash_buckets[bucket + 1]);

      if (lastno > file->n_hash_items)
        lastno = file->n_hash_items;
    }

  while G_LIKELY (itemno < lastno)
    {
      struct gvdb_hash_item *item = &file->hash_items[itemno];

      if (hash_value == guint32_from_le (item->hash_value))
        if G_LIKELY (gvdb_table_check_name (file, item, key, key_length))
          if G_LIKELY (item->type == type)
            return item;

      itemno++;
    }

  return NULL;
}

/**
 * gvdb_table_list:
 * @file: a #GvdbTable
 * @key: a string
 * @returns: a %NULL-terminated string array, or %NULL
 *
 * List all of the keys that appear below @key.  The nesting of keys
 * within the hash file is defined by the program that created the hash
 * file.  One thing is constant: each item in the returned array can be
 * concatenated to @key to obtain the full name of that key.
 *
 * %NULL is returned if @key does not name a list item in @file or if
 * the list data is invalid.  A list entry that refers to a nonexistent
 * item, or to an item whose key lies outside of the file, is returned
 * as an empty string.
 *
 * It is not possible to tell from this function if a given key is
 * itself a path, a value, or another hash table; you are expected to
 * know this for yourself.
 *
 * You should call g_strfreev() on the return result when you no longer
 * require it.
 **/
gchar **
gvdb_table_list (GvdbTable   *file,
                 const gchar *key)
{
  const struct gvdb_hash_item *item;
  const guint32_le *list;
  gchar **strv;
  gsize size;
  gsize i;

  if ((item = gvdb_table_lookup (file, key, 'L')) == NULL)
    return NULL;

  list = gvdb_table_dereference (file, &item->value.pointer, 4, &size);

  if G_UNLIKELY (list == NULL || size % 4)
    return NULL;

  /* From here on, size is the number of entries rather than bytes. */
  size /= 4;

  strv = g_new (gchar *, size + 1);
  for (i = 0; i < size; i++)
    {
      guint32 itemno = guint32_from_le (list[i]);

      if (itemno < file->n_hash_items)
        {
          const struct gvdb_hash_item *child;
          const gchar *string;
          gsize strsize;

          child = file->hash_items + itemno;

          string = gvdb_table_item_get_key (file, child, &strsize);

          if (string != NULL)
            strv[i] = g_strndup (string, strsize);
          else
            strv[i] = g_malloc0 (1);
        }
      else
        strv[i] = g_malloc0 (1);
    }

  strv[i] = NULL;

  return strv;
}

/**
 * gvdb_table_has_value:
 * @file: a #GvdbTable
 * @key: a string
 * @returns: %TRUE if @key is in the table
 *
 * Checks for a value named @key in @file.
 *
 * Note: this function does not consider non-value nodes (other hash
 * tables, for example).
 **/
gboolean
gvdb_table_has_value (GvdbTable    *file,
                      const gchar  *key)
{
  return gvdb_table_lookup (file, key, 'v') != NULL;
}

/**
 * gvdb_table_get_value:
 * @file: a #GvdbTable
 * @key: a string
 * @options: a pointer to a #GVariant, or %NULL
 * @returns: a #GVariant, or %NULL
 *
 * Looks up a value named @key in @file.
 *
 * If the value is not found then %NULL is returned and @options is
 * left untouched.  Otherwise, a new #GVariant instance is returned.
 * The #GVariant does not depend on the continued existence of @file
 * (it holds its own reference on the underlying mapped file).
 *
 * If @options is non-%NULL then it will be set either to %NULL in the
 * case of no options or a #GVariant containing a dictionary mapping
 * strings to variants.
 *
 * You should call g_variant_unref() on the return result when you no
 * longer require it.
 **/
GVariant *
gvdb_table_get_value (GvdbTable    *file,
                      const gchar  *key,
                      GVariant    **options)
{
  const struct gvdb_hash_item *item;
  GVariant *variant, *value;
  gconstpointer data;
  gsize size;

  if ((item = gvdb_table_lookup (file, key, 'v')) == NULL)
    return NULL;

  data = gvdb_table_dereference (file, &item->value.pointer, 8, &size);

  if G_UNLIKELY (data == NULL)
    return NULL;

  /* The variant borrows the mapped bytes; the extra reference on the
   * mapping is dropped by the destroy notify when the data is released.
   */
  variant = g_variant_new_from_data (G_VARIANT_TYPE_VARIANT,
                                     data, size, file->trusted,
                                     (GDestroyNotify) g_mapped_file_unref,
                                     g_mapped_file_ref (file->mapped));
  value = g_variant_get_variant (variant);
  g_variant_unref (variant);

  if (options != NULL)
    {
      data = gvdb_table_dereference (file, &item->options, 8, &size);

      if (data != NULL && size > 0)
        {
          *options = g_variant_new_from_data (G_VARIANT_TYPE ("a{sv}"),
                                              data, size, file->trusted,
                                              (GDestroyNotify) g_mapped_file_unref,
                                              g_mapped_file_ref (file->mapped));
          g_variant_ref_sink (*options);
        }
      else
        *options = NULL;
    }

  return value;
}

/**
 * gvdb_table_get_table:
 * @file: a #GvdbTable
 * @key: a string
 * @returns: a new #GvdbTable, or %NULL
 *
 * Looks up the hash table named @key in @file.
 *
 * The toplevel hash table in a #GvdbTable can contain reference to
 * child hash tables (and those can contain further references...).
 *
 * If @key is not found in @file then %NULL is returned.  Otherwise, a
 * new #GvdbTable is returned, referring to the child hashtable as
 * contained in the file.  This newly-created #GvdbTable does not depend
 * on the continued existence of @file.
 *
 * You should call gvdb_table_unref() on the return result when you no
 * longer require it.
 **/
GvdbTable *
gvdb_table_get_table (GvdbTable   *file,
                      const gchar *key)
{
  const struct gvdb_hash_item *item;
  GvdbTable *new;

  item = gvdb_table_lookup (file, key, 'H');

  if (item == NULL)
    return NULL;

  /* The child shares the parent's mapping (with its own reference) and
   * differs only in which hash table inside the file it points at.
   */
  new = g_slice_new0 (GvdbTable);
  new->mapped = g_mapped_file_ref (file->mapped);
  new->byteswapped = file->byteswapped;
  new->trusted = file->trusted;
  new->data = file->data;
  new->size = file->size;
  new->ref_count = 1;

  gvdb_table_setup_root (new, &item->value.pointer);

  return new;
}

/**
 * gvdb_table_ref:
 * @file: a #GvdbTable
 * @returns: a new reference on @file
 *
 * Increases the reference count on @file.
 **/
GvdbTable *
gvdb_table_ref (GvdbTable *file)
{
  g_atomic_int_inc (&file->ref_count);

  return file;
}

/**
 * gvdb_table_unref:
 * @file: a #GvdbTable
 *
 * Decreases the reference count on @file, possibly freeing it.
 *
 * Since: 2.26
 **/
void
gvdb_table_unref (GvdbTable *file)
{
  if (g_atomic_int_dec_and_test (&file->ref_count))
    {
      g_mapped_file_unref (file->mapped);
      g_slice_free (GvdbTable, file);
    }
}