mirror of
				https://gitlab.gnome.org/GNOME/glib.git
				synced 2025-10-25 14:32:16 +02:00 
			
		
		
		
	
		
			
				
	
	
		
			845 lines
		
	
	
		
			22 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			845 lines
		
	
	
		
			22 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| #include "cmph.h"
 | |
| #include "cmph_structs.h"
 | |
| #include "chm.h"
 | |
| #include "bmz.h" 
 | |
| #include "bmz8.h" 
 | |
| #include "brz.h" 
 | |
| #include "fch.h" 
 | |
| #include "bdz.h"
 | |
| #include "bdz_ph.h"
 | |
| #include "chd_ph.h"
 | |
| #include "chd.h"
 | |
| 
 | |
| #include <stdlib.h>
 | |
| #include <assert.h>
 | |
| #include <string.h>
 | |
| //#define DEBUG
 | |
| #include "debug.h"
 | |
| 
 | |
| const char *cmph_names[] = {"bmz", "bmz8", "chm", "brz", "fch", "bdz", "bdz_ph", "chd_ph", "chd", NULL };
 | |
| 
 | |
| typedef struct 
 | |
| {
 | |
| 	void *vector;
 | |
| 	cmph_uint32 position; // access position when data is a vector	
 | |
| } cmph_vector_t;
 | |
| 
 | |
| 
 | |
| 
 | |
| /** 
 | |
|  * Support a vector of struct as the source of keys.
 | |
|  *
 | |
|  * E.g. The keys could be the fieldB's in a vector of struct rec where 
 | |
|  * struct rec is defined as:
 | |
|  * struct rec {
 | |
|  *    fieldA;
 | |
|  *    fieldB;
 | |
|  *    fieldC;
 | |
|  * }
 | |
|  */
 | |
| typedef struct 
 | |
| {
 | |
| 	void *vector;					/* Pointer to the vector of struct */
 | |
| 	cmph_uint32 position; 			/* current position */
 | |
| 	cmph_uint32 struct_size;       	/* The size of the struct */
 | |
| 	cmph_uint32 key_offset;        	/* The byte offset of the key in the struct */
 | |
| 	cmph_uint32 key_len;          	/* The length of the key */
 | |
| } cmph_struct_vector_t;
 | |
| 
 | |
| 
 | |
| static cmph_io_adapter_t *cmph_io_vector_new(void * vector, cmph_uint32 nkeys);
 | |
| static void cmph_io_vector_destroy(cmph_io_adapter_t * key_source);
 | |
| 
 | |
| static cmph_io_adapter_t *cmph_io_struct_vector_new(void * vector, cmph_uint32 struct_size, cmph_uint32 key_offset, cmph_uint32 key_len, cmph_uint32 nkeys);
 | |
| static void cmph_io_struct_vector_destroy(cmph_io_adapter_t * key_source);
 | |
| 
 | |
| static int key_nlfile_read(void *data, char **key, cmph_uint32 *keylen)
 | |
| {
 | |
| 	FILE *fd = (FILE *)data;
 | |
| 	*key = NULL;
 | |
| 	*keylen = 0;
 | |
| 	while(1)
 | |
| 	{
 | |
| 		char buf[BUFSIZ];
 | |
| 		char *c = fgets(buf, BUFSIZ, fd); 
 | |
| 		if (c == NULL) return -1;
 | |
| 		if (feof(fd)) return -1;
 | |
| 		*key = (char *)realloc(*key, *keylen + strlen(buf) + 1);
 | |
| 		memcpy(*key + *keylen, buf, strlen(buf));
 | |
| 		*keylen += (cmph_uint32)strlen(buf);
 | |
| 		if (buf[strlen(buf) - 1] != '\n') continue;
 | |
| 		break;
 | |
| 	}
 | |
| 	if ((*keylen) && (*key)[*keylen - 1] == '\n')
 | |
| 	{
 | |
| 		(*key)[(*keylen) - 1] = 0;
 | |
| 		--(*keylen);
 | |
| 	}
 | |
| 	return (int)(*keylen);
 | |
| }
 | |
| 
 | |
| static int key_byte_vector_read(void *data, char **key, cmph_uint32 *keylen)
 | |
| {
 | |
| 	cmph_vector_t *cmph_vector = (cmph_vector_t *)data;
 | |
| 	cmph_uint8 **keys_vd = (cmph_uint8 **)cmph_vector->vector;
 | |
| 	size_t size;
 | |
| 	memcpy(keylen, keys_vd[cmph_vector->position], sizeof(*keylen));
 | |
| 	size = *keylen;
 | |
| 	*key = (char *)malloc(size);
 | |
| 	memcpy(*key, keys_vd[cmph_vector->position] + sizeof(*keylen), size);
 | |
| 	cmph_vector->position = cmph_vector->position + 1;
 | |
| 	return (int)(*keylen);
 | |
| 
 | |
| }
 | |
| 
 | |
| static int key_struct_vector_read(void *data, char **key, cmph_uint32 *keylen)
 | |
| {
 | |
|     cmph_struct_vector_t *cmph_struct_vector = (cmph_struct_vector_t *)data;
 | |
|     char *keys_vd = (char *)cmph_struct_vector->vector;
 | |
|     size_t size;
 | |
|     *keylen = cmph_struct_vector->key_len;
 | |
|     size = *keylen;
 | |
|     *key = (char *)malloc(size);
 | |
|     memcpy(*key, (keys_vd + (cmph_struct_vector->position * cmph_struct_vector->struct_size) + cmph_struct_vector->key_offset), size);
 | |
|     cmph_struct_vector->position = cmph_struct_vector->position + 1;
 | |
|     return (int)(*keylen);
 | |
| }
 | |
| 
 | |
| static int key_vector_read(void *data, char **key, cmph_uint32 *keylen)
 | |
| {
 | |
|         cmph_vector_t *cmph_vector = (cmph_vector_t *)data;
 | |
|         char **keys_vd = (char **)cmph_vector->vector;
 | |
| 	size_t size;
 | |
|         *keylen = (cmph_uint32)strlen(keys_vd[cmph_vector->position]);
 | |
| 	size = *keylen;
 | |
|         *key = (char *)malloc(size + 1);
 | |
|         strcpy(*key, keys_vd[cmph_vector->position]);
 | |
|         cmph_vector->position = cmph_vector->position + 1;
 | |
| 	return (int)(*keylen);
 | |
| 
 | |
| }
 | |
| 
 | |
| 
 | |
| static void key_nlfile_dispose(void *data, char *key, cmph_uint32 keylen)
 | |
| {
 | |
| 	free(key);
 | |
| }
 | |
| 
 | |
| static void key_vector_dispose(void *data, char *key, cmph_uint32 keylen)
 | |
| {
 | |
| 	free(key);
 | |
| }
 | |
| 
 | |
| static void key_nlfile_rewind(void *data)
 | |
| {
 | |
| 	FILE *fd = (FILE *)data;
 | |
| 	rewind(fd);
 | |
| }
 | |
| 
 | |
| static void key_struct_vector_rewind(void *data)
 | |
| {
 | |
| 	cmph_struct_vector_t *cmph_struct_vector = (cmph_struct_vector_t *)data;
 | |
| 	cmph_struct_vector->position = 0;
 | |
| }
 | |
| 
 | |
| static void key_vector_rewind(void *data)
 | |
| {
 | |
| 	cmph_vector_t *cmph_vector = (cmph_vector_t *)data;
 | |
| 	cmph_vector->position = 0;
 | |
| }
 | |
| 
 | |
| static cmph_uint32 count_nlfile_keys(FILE *fd)
 | |
| {
 | |
| 	cmph_uint32 count = 0;
 | |
| 	rewind(fd);
 | |
| 	while(1)
 | |
| 	{
 | |
| 		char buf[BUFSIZ];
 | |
| 		if (fgets(buf, BUFSIZ, fd) == NULL) break;
 | |
| 		if (feof(fd)) break;
 | |
| 		if (buf[strlen(buf) - 1] != '\n') continue;
 | |
| 		++count;
 | |
| 	}
 | |
| 	rewind(fd);
 | |
| 	return count;
 | |
| }
 | |
| 
 | |
| cmph_io_adapter_t *cmph_io_nlfile_adapter(FILE * keys_fd)
 | |
| {
 | |
|   cmph_io_adapter_t * key_source = (cmph_io_adapter_t *)malloc(sizeof(cmph_io_adapter_t));
 | |
|   assert(key_source);
 | |
|   key_source->data = (void *)keys_fd;
 | |
|   key_source->nkeys = count_nlfile_keys(keys_fd);
 | |
|   key_source->read = key_nlfile_read;
 | |
|   key_source->dispose = key_nlfile_dispose;
 | |
|   key_source->rewind = key_nlfile_rewind;
 | |
|   return key_source;
 | |
| }
 | |
| 
 | |
| void cmph_io_nlfile_adapter_destroy(cmph_io_adapter_t * key_source)
 | |
| {
 | |
| 	free(key_source);
 | |
| }
 | |
| 
 | |
| cmph_io_adapter_t *cmph_io_nlnkfile_adapter(FILE * keys_fd, cmph_uint32 nkeys)
 | |
| {
 | |
|   cmph_io_adapter_t * key_source = (cmph_io_adapter_t *)malloc(sizeof(cmph_io_adapter_t));
 | |
|   assert(key_source);
 | |
|   key_source->data = (void *)keys_fd;
 | |
|   key_source->nkeys = nkeys;
 | |
|   key_source->read = key_nlfile_read;
 | |
|   key_source->dispose = key_nlfile_dispose;
 | |
|   key_source->rewind = key_nlfile_rewind;
 | |
|   return key_source;
 | |
| }
 | |
| 
 | |
| void cmph_io_nlnkfile_adapter_destroy(cmph_io_adapter_t * key_source)
 | |
| {
 | |
| 	free(key_source);
 | |
| }
 | |
| 
 | |
| 
 | |
| static cmph_io_adapter_t *cmph_io_struct_vector_new(void * vector, cmph_uint32 struct_size, cmph_uint32 key_offset, cmph_uint32 key_len, cmph_uint32 nkeys)
 | |
| {
 | |
| 	cmph_io_adapter_t * key_source = (cmph_io_adapter_t *)malloc(sizeof(cmph_io_adapter_t));
 | |
| 	cmph_struct_vector_t * cmph_struct_vector = (cmph_struct_vector_t *)malloc(sizeof(cmph_struct_vector_t));
 | |
| 	assert(key_source);
 | |
| 	assert(cmph_struct_vector);
 | |
| 	cmph_struct_vector->vector = vector;
 | |
| 	cmph_struct_vector->position = 0;
 | |
| 	cmph_struct_vector->struct_size = struct_size;
 | |
| 	cmph_struct_vector->key_offset = key_offset;
 | |
| 	cmph_struct_vector->key_len = key_len;
 | |
| 	key_source->data = (void *)cmph_struct_vector;
 | |
| 	key_source->nkeys = nkeys;
 | |
| 	return key_source;
 | |
| }
 | |
| 
 | |
| static void cmph_io_struct_vector_destroy(cmph_io_adapter_t * key_source)
 | |
| {
 | |
| 	cmph_struct_vector_t *cmph_struct_vector = (cmph_struct_vector_t *)key_source->data;
 | |
| 	cmph_struct_vector->vector = NULL;
 | |
| 	free(cmph_struct_vector);
 | |
| 	free(key_source);
 | |
| }
 | |
| 
 | |
| static cmph_io_adapter_t *cmph_io_vector_new(void * vector, cmph_uint32 nkeys)
 | |
| {
 | |
| 	cmph_io_adapter_t * key_source = (cmph_io_adapter_t *)malloc(sizeof(cmph_io_adapter_t));
 | |
| 	cmph_vector_t * cmph_vector = (cmph_vector_t *)malloc(sizeof(cmph_vector_t));
 | |
| 	assert(key_source);
 | |
| 	assert(cmph_vector);
 | |
| 	cmph_vector->vector = vector;
 | |
| 	cmph_vector->position = 0;
 | |
| 	key_source->data = (void *)cmph_vector;
 | |
| 	key_source->nkeys = nkeys;
 | |
| 	return key_source;
 | |
| }
 | |
| 
 | |
| static void cmph_io_vector_destroy(cmph_io_adapter_t * key_source)
 | |
| {
 | |
| 	cmph_vector_t *cmph_vector = (cmph_vector_t *)key_source->data;
 | |
| 	cmph_vector->vector = NULL;
 | |
| 	free(cmph_vector);
 | |
| 	free(key_source);
 | |
| }
 | |
| 
 | |
| cmph_io_adapter_t *cmph_io_byte_vector_adapter(cmph_uint8 ** vector, cmph_uint32 nkeys)
 | |
| {
 | |
| 	cmph_io_adapter_t * key_source = cmph_io_vector_new(vector, nkeys);
 | |
| 	key_source->read = key_byte_vector_read;
 | |
| 	key_source->dispose = key_vector_dispose;
 | |
| 	key_source->rewind = key_vector_rewind;
 | |
| 	return key_source;
 | |
| }
 | |
| void cmph_io_byte_vector_adapter_destroy(cmph_io_adapter_t * key_source)
 | |
| {
 | |
| 	cmph_io_vector_destroy(key_source);
 | |
| }
 | |
| 
 | |
| cmph_io_adapter_t *cmph_io_struct_vector_adapter(void * vector, cmph_uint32 struct_size, cmph_uint32 key_offset, cmph_uint32 key_len, cmph_uint32 nkeys)
 | |
| {
 | |
| 	cmph_io_adapter_t * key_source = cmph_io_struct_vector_new(vector, struct_size, key_offset, key_len, nkeys);
 | |
| 	key_source->read = key_struct_vector_read;
 | |
| 	key_source->dispose = key_vector_dispose;
 | |
| 	key_source->rewind = key_struct_vector_rewind;
 | |
| 	return key_source;	
 | |
| }
 | |
| 
 | |
| void cmph_io_struct_vector_adapter_destroy(cmph_io_adapter_t * key_source)
 | |
| {
 | |
| 	cmph_io_struct_vector_destroy(key_source);	
 | |
| }
 | |
| 
 | |
| cmph_io_adapter_t *cmph_io_vector_adapter(char ** vector, cmph_uint32 nkeys)
 | |
| {
 | |
| 	cmph_io_adapter_t * key_source = cmph_io_vector_new(vector, nkeys);
 | |
| 	key_source->read = key_vector_read;
 | |
| 	key_source->dispose = key_vector_dispose;
 | |
| 	key_source->rewind = key_vector_rewind;
 | |
| 	return key_source;
 | |
| }
 | |
| 
 | |
| void cmph_io_vector_adapter_destroy(cmph_io_adapter_t * key_source)
 | |
| {
 | |
| 	cmph_io_vector_destroy(key_source);
 | |
| }
 | |
| 
 | |
| cmph_config_t *cmph_config_new(cmph_io_adapter_t *key_source)
 | |
| {
 | |
| 	cmph_config_t *mph = NULL;
 | |
| 	mph = __config_new(key_source);
 | |
| 	assert(mph);
 | |
| 	mph->algo = CMPH_CHM; // default value
 | |
| 	mph->data = chm_config_new();
 | |
| 	return mph;
 | |
| }
 | |
| 
 | |
| void cmph_config_set_algo(cmph_config_t *mph, CMPH_ALGO algo)
 | |
| {
 | |
| 	if (algo != mph->algo)
 | |
| 	{
 | |
| 		switch (mph->algo)
 | |
| 		{
 | |
| 			case CMPH_CHM:
 | |
| 				chm_config_destroy(mph);
 | |
| 				break;
 | |
| 			case CMPH_BMZ:
 | |
| 				bmz_config_destroy(mph);
 | |
| 				break;
 | |
| 			case CMPH_BMZ8:
 | |
| 				bmz8_config_destroy(mph);
 | |
| 				break;
 | |
| 			case CMPH_BRZ:
 | |
| 				brz_config_destroy(mph);
 | |
| 				break;
 | |
| 			case CMPH_FCH:
 | |
| 				fch_config_destroy(mph);
 | |
| 				break;
 | |
| 			case CMPH_BDZ:
 | |
| 				bdz_config_destroy(mph);
 | |
| 				break;
 | |
| 			case CMPH_BDZ_PH:
 | |
| 				bdz_ph_config_destroy(mph);
 | |
| 				break;
 | |
| 			case CMPH_CHD_PH:
 | |
| 				chd_ph_config_destroy(mph);
 | |
| 				break;
 | |
| 			case CMPH_CHD:
 | |
| 				chd_config_destroy(mph);
 | |
| 				break;
 | |
| 			default:
 | |
| 				assert(0);
 | |
| 		}
 | |
| 		switch(algo)
 | |
| 		{
 | |
| 			case CMPH_CHM:
 | |
| 				mph->data = chm_config_new();
 | |
| 				break;
 | |
| 			case CMPH_BMZ:
 | |
| 				mph->data = bmz_config_new();
 | |
| 				break;
 | |
| 			case CMPH_BMZ8:
 | |
| 				mph->data = bmz8_config_new();
 | |
| 				break;
 | |
| 			case CMPH_BRZ:
 | |
| 				mph->data = brz_config_new();
 | |
| 				break;
 | |
| 			case CMPH_FCH:
 | |
| 				mph->data = fch_config_new();
 | |
| 				break;
 | |
| 			case CMPH_BDZ:
 | |
| 				mph->data = bdz_config_new();
 | |
| 				break;
 | |
| 			case CMPH_BDZ_PH:
 | |
| 				mph->data = bdz_ph_config_new();
 | |
| 				break;
 | |
| 			case CMPH_CHD_PH:
 | |
| 				mph->data = chd_ph_config_new();
 | |
| 				break;
 | |
| 			case CMPH_CHD:
 | |
| 				mph->data = chd_config_new(mph);
 | |
| 				break;
 | |
| 			default:
 | |
| 				assert(0);
 | |
| 		}
 | |
| 	}
 | |
| 	mph->algo = algo;
 | |
| }
 | |
| 
 | |
| void cmph_config_set_tmp_dir(cmph_config_t *mph, cmph_uint8 *tmp_dir)
 | |
| {
 | |
| 	if (mph->algo == CMPH_BRZ) 
 | |
| 	{
 | |
| 		brz_config_set_tmp_dir(mph, tmp_dir);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| 
 | |
| void cmph_config_set_mphf_fd(cmph_config_t *mph, FILE *mphf_fd)
 | |
| {
 | |
| 	if (mph->algo == CMPH_BRZ) 
 | |
| 	{
 | |
| 		brz_config_set_mphf_fd(mph, mphf_fd);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| void cmph_config_set_b(cmph_config_t *mph, cmph_uint32 b)
 | |
| {
 | |
| 	if (mph->algo == CMPH_BRZ) 
 | |
| 	{
 | |
| 		brz_config_set_b(mph, b);
 | |
| 	}
 | |
| 	else if (mph->algo == CMPH_BDZ) 
 | |
| 	{
 | |
| 		bdz_config_set_b(mph, b);
 | |
| 	}
 | |
| 	else if (mph->algo == CMPH_CHD_PH) 
 | |
| 	{
 | |
| 		chd_ph_config_set_b(mph, b);
 | |
| 	}
 | |
| 	else if (mph->algo == CMPH_CHD) 
 | |
| 	{
 | |
| 		chd_config_set_b(mph, b);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| void cmph_config_set_keys_per_bin(cmph_config_t *mph, cmph_uint32 keys_per_bin)
 | |
| {
 | |
| 	if (mph->algo == CMPH_CHD_PH) 
 | |
| 	{
 | |
| 		chd_ph_config_set_keys_per_bin(mph, keys_per_bin);
 | |
| 	}
 | |
| 	else if (mph->algo == CMPH_CHD) 
 | |
| 	{
 | |
| 		chd_config_set_keys_per_bin(mph, keys_per_bin);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| void cmph_config_set_memory_availability(cmph_config_t *mph, cmph_uint32 memory_availability)
 | |
| {
 | |
| 	if (mph->algo == CMPH_BRZ) 
 | |
| 	{
 | |
| 		brz_config_set_memory_availability(mph, memory_availability);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| void cmph_config_destroy(cmph_config_t *mph)
 | |
| {
 | |
| 	if(mph)
 | |
| 	{
 | |
| 		DEBUGP("Destroying mph with algo %s\n", cmph_names[mph->algo]);
 | |
| 		switch (mph->algo)
 | |
| 		{
 | |
| 			case CMPH_CHM:
 | |
| 				chm_config_destroy(mph);
 | |
| 				break;
 | |
| 			case CMPH_BMZ: /* included -- Fabiano */
 | |
| 				bmz_config_destroy(mph);
 | |
| 				break;
 | |
| 			case CMPH_BMZ8: /* included -- Fabiano */
 | |
| 				bmz8_config_destroy(mph);
 | |
| 				break;
 | |
| 			case CMPH_BRZ: /* included -- Fabiano */
 | |
| 				brz_config_destroy(mph);
 | |
| 				break;
 | |
| 			case CMPH_FCH: /* included -- Fabiano */
 | |
| 				fch_config_destroy(mph);
 | |
| 				break;
 | |
| 			case CMPH_BDZ: /* included -- Fabiano */
 | |
| 				bdz_config_destroy(mph);
 | |
| 				break;
 | |
| 			case CMPH_BDZ_PH: /* included -- Fabiano */
 | |
| 				bdz_ph_config_destroy(mph);
 | |
| 				break;
 | |
| 			case CMPH_CHD_PH: /* included -- Fabiano */
 | |
| 				chd_ph_config_destroy(mph);
 | |
| 				break;
 | |
| 			case CMPH_CHD: /* included -- Fabiano */
 | |
| 				chd_config_destroy(mph);
 | |
| 				break;
 | |
| 			default:
 | |
| 				assert(0);
 | |
| 		}
 | |
| 		__config_destroy(mph);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| void cmph_config_set_verbosity(cmph_config_t *mph, cmph_uint32 verbosity)
 | |
| {
 | |
| 	mph->verbosity = verbosity;
 | |
| }
 | |
| 
 | |
| void cmph_config_set_hashfuncs(cmph_config_t *mph, CMPH_HASH *hashfuncs)
 | |
| {
 | |
| 	switch (mph->algo)
 | |
| 	{
 | |
| 		case CMPH_CHM:
 | |
| 			chm_config_set_hashfuncs(mph, hashfuncs);
 | |
| 			break;
 | |
| 		case CMPH_BMZ: /* included -- Fabiano */
 | |
| 			bmz_config_set_hashfuncs(mph, hashfuncs);
 | |
| 			break;
 | |
| 		case CMPH_BMZ8: /* included -- Fabiano */
 | |
| 			bmz8_config_set_hashfuncs(mph, hashfuncs);
 | |
| 			break;
 | |
| 		case CMPH_BRZ: /* included -- Fabiano */
 | |
| 			brz_config_set_hashfuncs(mph, hashfuncs);
 | |
| 			break;
 | |
| 		case CMPH_FCH: /* included -- Fabiano */
 | |
| 			fch_config_set_hashfuncs(mph, hashfuncs);
 | |
| 			break;
 | |
| 		case CMPH_BDZ: /* included -- Fabiano */
 | |
| 			bdz_config_set_hashfuncs(mph, hashfuncs);
 | |
| 			break;
 | |
| 		case CMPH_BDZ_PH: /* included -- Fabiano */
 | |
| 			bdz_ph_config_set_hashfuncs(mph, hashfuncs);
 | |
| 			break;
 | |
| 		case CMPH_CHD_PH: /* included -- Fabiano */
 | |
| 			chd_ph_config_set_hashfuncs(mph, hashfuncs);
 | |
| 			break;
 | |
| 		case CMPH_CHD: /* included -- Fabiano */
 | |
| 			chd_config_set_hashfuncs(mph, hashfuncs);
 | |
| 			break;
 | |
| 		default:
 | |
| 			break;
 | |
| 	}
 | |
| 	return;
 | |
| }
 | |
| void cmph_config_set_graphsize(cmph_config_t *mph, double c)
 | |
| {
 | |
| 	mph->c = c;
 | |
| 	return;
 | |
| }
 | |
| 
 | |
| cmph_t *cmph_new(cmph_config_t *mph)
 | |
| {
 | |
| 	cmph_t *mphf = NULL;
 | |
| 	double c = mph->c;
 | |
| 
 | |
| 	DEBUGP("Creating mph with algorithm %s\n", cmph_names[mph->algo]);
 | |
| 	switch (mph->algo)	
 | |
| 	{
 | |
| 		case CMPH_CHM:
 | |
| 			DEBUGP("Creating chm hash\n");
 | |
| 			mphf = chm_new(mph, c);
 | |
| 			break;
 | |
| 		case CMPH_BMZ: /* included -- Fabiano */
 | |
| 			DEBUGP("Creating bmz hash\n");
 | |
| 			mphf = bmz_new(mph, c);
 | |
| 			break;
 | |
| 		case CMPH_BMZ8: /* included -- Fabiano */
 | |
| 			DEBUGP("Creating bmz8 hash\n");
 | |
| 			mphf = bmz8_new(mph, c);
 | |
| 			break;
 | |
| 		case CMPH_BRZ: /* included -- Fabiano */
 | |
| 			DEBUGP("Creating brz hash\n");
 | |
| 			if (c >= 2.0) brz_config_set_algo(mph, CMPH_FCH);
 | |
| 			else brz_config_set_algo(mph, CMPH_BMZ8);
 | |
| 			mphf = brz_new(mph, c);
 | |
| 			break;
 | |
| 		case CMPH_FCH: /* included -- Fabiano */
 | |
| 			DEBUGP("Creating fch hash\n");
 | |
| 			mphf = fch_new(mph, c);
 | |
| 			break;
 | |
| 		case CMPH_BDZ: /* included -- Fabiano */
 | |
| 			DEBUGP("Creating bdz hash\n");
 | |
| 			mphf = bdz_new(mph, c);
 | |
| 			break;
 | |
| 		case CMPH_BDZ_PH: /* included -- Fabiano */
 | |
| 			DEBUGP("Creating bdz_ph hash\n");
 | |
| 			mphf = bdz_ph_new(mph, c);
 | |
| 			break;
 | |
| 		case CMPH_CHD_PH: /* included -- Fabiano */
 | |
| 			DEBUGP("Creating chd_ph hash\n");
 | |
| 			mphf = chd_ph_new(mph, c);
 | |
| 			break;
 | |
| 		case CMPH_CHD: /* included -- Fabiano */
 | |
| 			DEBUGP("Creating chd hash\n");
 | |
| 			mphf = chd_new(mph, c);
 | |
| 			break;
 | |
| 		default:
 | |
| 			assert(0);
 | |
| 	}
 | |
| 	return mphf;
 | |
| }
 | |
| 
 | |
| int cmph_dump(cmph_t *mphf, FILE *f)
 | |
| {
 | |
| 	switch (mphf->algo)
 | |
| 	{
 | |
| 		case CMPH_CHM:
 | |
| 			return chm_dump(mphf, f);
 | |
| 		case CMPH_BMZ: /* included -- Fabiano */
 | |
| 			return bmz_dump(mphf, f);
 | |
| 		case CMPH_BMZ8: /* included -- Fabiano */
 | |
| 			return bmz8_dump(mphf, f);
 | |
| 		case CMPH_BRZ: /* included -- Fabiano */
 | |
| 			return brz_dump(mphf, f);
 | |
| 		case CMPH_FCH: /* included -- Fabiano */
 | |
| 			return fch_dump(mphf, f);
 | |
| 		case CMPH_BDZ: /* included -- Fabiano */
 | |
| 			return bdz_dump(mphf, f);
 | |
| 		case CMPH_BDZ_PH: /* included -- Fabiano */
 | |
| 			return bdz_ph_dump(mphf, f);
 | |
| 		case CMPH_CHD_PH: /* included -- Fabiano */
 | |
| 			return chd_ph_dump(mphf, f);
 | |
| 		case CMPH_CHD: /* included -- Fabiano */
 | |
| 			return chd_dump(mphf, f);
 | |
| 		default:
 | |
| 			assert(0);
 | |
| 	}
 | |
| 	assert(0);
 | |
| 	return 0;
 | |
| }
 | |
| cmph_t *cmph_load(FILE *f)
 | |
| {
 | |
| 	cmph_t *mphf = NULL;
 | |
| 	DEBUGP("Loading mphf generic parts\n");
 | |
| 	mphf =  __cmph_load(f);
 | |
| 	if (mphf == NULL) return NULL;
 | |
| 	DEBUGP("Loading mphf algorithm dependent parts\n");
 | |
| 
 | |
| 	switch (mphf->algo)
 | |
| 	{
 | |
| 		case CMPH_CHM:
 | |
| 			chm_load(f, mphf);
 | |
| 			break;
 | |
| 		case CMPH_BMZ: /* included -- Fabiano */
 | |
| 			DEBUGP("Loading bmz algorithm dependent parts\n");
 | |
| 			bmz_load(f, mphf);
 | |
| 			break;
 | |
| 		case CMPH_BMZ8: /* included -- Fabiano */
 | |
| 			DEBUGP("Loading bmz8 algorithm dependent parts\n");
 | |
| 			bmz8_load(f, mphf);
 | |
| 			break;
 | |
| 		case CMPH_BRZ: /* included -- Fabiano */
 | |
| 			DEBUGP("Loading brz algorithm dependent parts\n");
 | |
| 			brz_load(f, mphf);
 | |
| 			break;
 | |
| 		case CMPH_FCH: /* included -- Fabiano */
 | |
| 			DEBUGP("Loading fch algorithm dependent parts\n");
 | |
| 			fch_load(f, mphf);
 | |
| 			break;
 | |
| 		case CMPH_BDZ: /* included -- Fabiano */
 | |
| 			DEBUGP("Loading bdz algorithm dependent parts\n");
 | |
| 			bdz_load(f, mphf);
 | |
| 			break;
 | |
| 		case CMPH_BDZ_PH: /* included -- Fabiano */
 | |
| 			DEBUGP("Loading bdz_ph algorithm dependent parts\n");
 | |
| 			bdz_ph_load(f, mphf);
 | |
| 			break;
 | |
| 		case CMPH_CHD_PH: /* included -- Fabiano */
 | |
| 			DEBUGP("Loading chd_ph algorithm dependent parts\n");
 | |
| 			chd_ph_load(f, mphf);
 | |
| 			break;
 | |
| 		case CMPH_CHD: /* included -- Fabiano */
 | |
| 			DEBUGP("Loading chd algorithm dependent parts\n");
 | |
| 			chd_load(f, mphf);
 | |
| 			break;
 | |
| 		default:
 | |
| 			assert(0);
 | |
| 	}
 | |
| 	DEBUGP("Loaded mphf\n");
 | |
| 	return mphf;
 | |
| }
 | |
| 
 | |
| 
 | |
| cmph_uint32 cmph_search(cmph_t *mphf, const char *key, cmph_uint32 keylen)
 | |
| {
 | |
|    	DEBUGP("mphf algorithm: %u \n", mphf->algo);
 | |
| 	switch(mphf->algo)
 | |
| 	{
 | |
| 		case CMPH_CHM:
 | |
| 			return chm_search(mphf, key, keylen);
 | |
| 		case CMPH_BMZ: /* included -- Fabiano */
 | |
| 		        DEBUGP("bmz algorithm search\n");		         
 | |
| 		        return bmz_search(mphf, key, keylen);
 | |
| 		case CMPH_BMZ8: /* included -- Fabiano */
 | |
| 		        DEBUGP("bmz8 algorithm search\n");		         
 | |
| 		        return bmz8_search(mphf, key, keylen);
 | |
| 		case CMPH_BRZ: /* included -- Fabiano */
 | |
| 		        DEBUGP("brz algorithm search\n");		         
 | |
| 		        return brz_search(mphf, key, keylen);
 | |
| 		case CMPH_FCH: /* included -- Fabiano */
 | |
| 		        DEBUGP("fch algorithm search\n");		         
 | |
| 		        return fch_search(mphf, key, keylen);
 | |
| 		case CMPH_BDZ: /* included -- Fabiano */
 | |
| 		        DEBUGP("bdz algorithm search\n");		         
 | |
| 		        return bdz_search(mphf, key, keylen);
 | |
| 		case CMPH_BDZ_PH: /* included -- Fabiano */
 | |
| 		        DEBUGP("bdz_ph algorithm search\n");		         
 | |
| 		        return bdz_ph_search(mphf, key, keylen);
 | |
| 		case CMPH_CHD_PH: /* included -- Fabiano */
 | |
| 		        DEBUGP("chd_ph algorithm search\n");		         
 | |
| 		        return chd_ph_search(mphf, key, keylen);
 | |
| 		case CMPH_CHD: /* included -- Fabiano */
 | |
| 		        DEBUGP("chd algorithm search\n");		         
 | |
| 		        return chd_search(mphf, key, keylen);
 | |
| 		default:
 | |
| 			assert(0);
 | |
| 	}
 | |
| 	assert(0);
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| cmph_uint32 cmph_size(cmph_t *mphf)
 | |
| {
 | |
| 	return mphf->size;
 | |
| }
 | |
| 	
 | |
| void cmph_destroy(cmph_t *mphf)
 | |
| {
 | |
| 	switch(mphf->algo)
 | |
| 	{
 | |
| 		case CMPH_CHM:
 | |
| 			chm_destroy(mphf);
 | |
| 			return;
 | |
| 		case CMPH_BMZ: /* included -- Fabiano */
 | |
| 			bmz_destroy(mphf);
 | |
| 			return;
 | |
| 		case CMPH_BMZ8: /* included -- Fabiano */
 | |
| 			bmz8_destroy(mphf);
 | |
| 			return;
 | |
| 		case CMPH_BRZ: /* included -- Fabiano */
 | |
| 			brz_destroy(mphf);
 | |
| 			return;
 | |
| 		case CMPH_FCH: /* included -- Fabiano */
 | |
| 			fch_destroy(mphf);
 | |
| 			return;
 | |
| 		case CMPH_BDZ: /* included -- Fabiano */
 | |
| 			bdz_destroy(mphf);
 | |
| 			return;
 | |
| 		case CMPH_BDZ_PH: /* included -- Fabiano */
 | |
| 			bdz_ph_destroy(mphf);
 | |
| 			return;
 | |
| 		case CMPH_CHD_PH: /* included -- Fabiano */
 | |
| 			chd_ph_destroy(mphf);
 | |
| 			return;
 | |
| 		case CMPH_CHD: /* included -- Fabiano */
 | |
| 			chd_destroy(mphf);
 | |
| 			return;
 | |
| 		default: 
 | |
| 			assert(0);
 | |
| 	}
 | |
| 	assert(0);
 | |
| 	return;
 | |
| }
 | |
| 
 | |
| 
 | |
| /** \fn void cmph_pack(cmph_t *mphf, void *packed_mphf);
 | |
|  *  \brief Support the ability to pack a perfect hash function into a preallocated contiguous memory space pointed by packed_mphf.
 | |
|  *  \param mphf pointer to the resulting mphf
 | |
|  *  \param packed_mphf pointer to the contiguous memory area used to store the resulting mphf. The size of packed_mphf must be at least cmph_packed_size() 
 | |
|  */
 | |
| void cmph_pack(cmph_t *mphf, void *packed_mphf)
 | |
| {
 | |
| 	// packing algorithm type to be used in cmph.c
 | |
| 	cmph_uint32 * ptr = (cmph_uint32 *) packed_mphf; 
 | |
| 	*ptr++ = mphf->algo;
 | |
| 	DEBUGP("mphf->algo = %u\n", mphf->algo);
 | |
| 	switch(mphf->algo)
 | |
| 	{
 | |
| 		case CMPH_CHM:
 | |
| 			chm_pack(mphf, ptr);
 | |
| 			break;
 | |
| 		case CMPH_BMZ: /* included -- Fabiano */
 | |
| 			bmz_pack(mphf, ptr);
 | |
| 			break;
 | |
| 		case CMPH_BMZ8: /* included -- Fabiano */
 | |
| 			bmz8_pack(mphf, ptr);
 | |
| 			break;
 | |
| 		case CMPH_BRZ: /* included -- Fabiano */
 | |
| 			brz_pack(mphf, ptr);
 | |
| 			break;
 | |
| 		case CMPH_FCH: /* included -- Fabiano */
 | |
| 			fch_pack(mphf, ptr);
 | |
| 			break;
 | |
| 		case CMPH_BDZ: /* included -- Fabiano */
 | |
| 			bdz_pack(mphf, ptr);
 | |
| 			break;
 | |
| 		case CMPH_BDZ_PH: /* included -- Fabiano */
 | |
| 			bdz_ph_pack(mphf, ptr);
 | |
| 			break;
 | |
| 		case CMPH_CHD_PH: /* included -- Fabiano */
 | |
| 			chd_ph_pack(mphf, ptr);
 | |
| 			break;
 | |
| 		case CMPH_CHD: /* included -- Fabiano */
 | |
| 			chd_pack(mphf, ptr);
 | |
| 			break;
 | |
| 		default: 
 | |
| 			assert(0);
 | |
| 	}
 | |
| 	return;
 | |
| }
 | |
| 
 | |
| /** \fn cmph_uint32 cmph_packed_size(cmph_t *mphf);
 | |
|  *  \brief Return the amount of space needed to pack mphf.
 | |
|  *  \param mphf pointer to a mphf
 | |
|  *  \return the size of the packed function or zero for failures
 | |
|  */ 
 | |
| cmph_uint32 cmph_packed_size(cmph_t *mphf)
 | |
| {
 | |
| 	switch(mphf->algo)
 | |
| 	{
 | |
| 		case CMPH_CHM:
 | |
| 			return chm_packed_size(mphf);
 | |
| 		case CMPH_BMZ: /* included -- Fabiano */
 | |
| 			return bmz_packed_size(mphf);
 | |
| 		case CMPH_BMZ8: /* included -- Fabiano */
 | |
| 			return bmz8_packed_size(mphf);
 | |
| 		case CMPH_BRZ: /* included -- Fabiano */
 | |
| 			return brz_packed_size(mphf);
 | |
| 		case CMPH_FCH: /* included -- Fabiano */
 | |
| 			return fch_packed_size(mphf);
 | |
| 		case CMPH_BDZ: /* included -- Fabiano */
 | |
| 			return bdz_packed_size(mphf);
 | |
| 		case CMPH_BDZ_PH: /* included -- Fabiano */
 | |
| 			return bdz_ph_packed_size(mphf);
 | |
| 		case CMPH_CHD_PH: /* included -- Fabiano */
 | |
| 			return chd_ph_packed_size(mphf);
 | |
| 		case CMPH_CHD: /* included -- Fabiano */
 | |
| 			return chd_packed_size(mphf);
 | |
| 		default: 
 | |
| 			assert(0);
 | |
| 	}
 | |
| 	return 0; // FAILURE
 | |
| }
 | |
| 
 | |
| /** cmph_uint32 cmph_search(void *packed_mphf, const char *key, cmph_uint32 keylen);
 | |
|  *  \brief Use the packed mphf to do a search. 
 | |
|  *  \param  packed_mphf pointer to the packed mphf
 | |
|  *  \param key key to be hashed
 | |
|  *  \param keylen key length in bytes
 | |
|  *  \return The mphf value
 | |
|  */
 | |
| cmph_uint32 cmph_search_packed(void *packed_mphf, const char *key, cmph_uint32 keylen)
 | |
| {
 | |
| 	cmph_uint32 *ptr = (cmph_uint32 *)packed_mphf;
 | |
| //	fprintf(stderr, "algo:%u\n", *ptr);
 | |
| 	switch(*ptr)
 | |
| 	{
 | |
| 		case CMPH_CHM:
 | |
| 			return chm_search_packed(++ptr, key, keylen);
 | |
| 		case CMPH_BMZ: /* included -- Fabiano */
 | |
| 			return bmz_search_packed(++ptr, key, keylen);
 | |
| 		case CMPH_BMZ8: /* included -- Fabiano */
 | |
| 			return bmz8_search_packed(++ptr, key, keylen);
 | |
| 		case CMPH_BRZ: /* included -- Fabiano */
 | |
| 			return brz_search_packed(++ptr, key, keylen);
 | |
| 		case CMPH_FCH: /* included -- Fabiano */
 | |
| 			return fch_search_packed(++ptr, key, keylen);
 | |
| 		case CMPH_BDZ: /* included -- Fabiano */
 | |
| 			return bdz_search_packed(++ptr, key, keylen);
 | |
| 		case CMPH_BDZ_PH: /* included -- Fabiano */
 | |
| 			return bdz_ph_search_packed(++ptr, key, keylen);
 | |
| 		case CMPH_CHD_PH: /* included -- Fabiano */
 | |
| 			return chd_ph_search_packed(++ptr, key, keylen);
 | |
| 		case CMPH_CHD: /* included -- Fabiano */
 | |
| 			return chd_search_packed(++ptr, key, keylen);
 | |
| 		default: 
 | |
| 			assert(0);
 | |
| 	}
 | |
| 	return 0; // FAILURE
 | |
| }
 |