turbonss/src/cmph.c

850 lines
22 KiB
C
Raw Normal View History

2004-12-23 15:16:30 +02:00
#include "cmph.h"
#include "cmph_structs.h"
2005-01-25 23:06:58 +02:00
#include "chm.h"
#include "bmz.h"
#include "bmz8.h"
#include "brz.h"
#include "fch.h"
2009-07-05 06:17:36 +03:00
#include "bdz.h"
#include "bdz_ph.h"
#include "chd_ph.h"
#include "chd.h"
2004-12-23 15:16:30 +02:00
#include <stdlib.h>
#include <assert.h>
#include <string.h>
2011-02-16 06:46:05 +02:00
// #define DEBUG
2004-12-23 15:16:30 +02:00
#include "debug.h"
2009-07-05 06:17:36 +03:00
const char *cmph_names[] = {"bmz", "bmz8", "chm", "brz", "fch", "bdz", "bdz_ph", "chd_ph", "chd", NULL };
2004-12-23 15:16:30 +02:00
2011-12-26 23:12:24 +02:00
typedef struct
2005-10-10 20:43:21 +03:00
{
void *vector;
2011-12-26 23:12:24 +02:00
cmph_uint32 position; // access position when data is a vector
2005-10-10 20:43:21 +03:00
} cmph_vector_t;
2008-03-30 02:23:41 +02:00
2011-12-26 23:12:24 +02:00
/**
2008-03-30 02:23:41 +02:00
* Support a vector of struct as the source of keys.
*
2011-12-26 23:12:24 +02:00
* E.g. The keys could be the fieldB's in a vector of struct rec where
2008-03-30 02:23:41 +02:00
* struct rec is defined as:
* struct rec {
* fieldA;
* fieldB;
* fieldC;
* }
*/
2011-12-26 23:12:24 +02:00
typedef struct
2008-03-30 02:23:41 +02:00
{
void *vector; /* Pointer to the vector of struct */
cmph_uint32 position; /* current position */
cmph_uint32 struct_size; /* The size of the struct */
cmph_uint32 key_offset; /* The byte offset of the key in the struct */
cmph_uint32 key_len; /* The length of the key */
} cmph_struct_vector_t;
2005-10-10 20:43:21 +03:00
static cmph_io_adapter_t *cmph_io_vector_new(void * vector, cmph_uint32 nkeys);
static void cmph_io_vector_destroy(cmph_io_adapter_t * key_source);
2005-07-26 00:26:17 +03:00
2008-03-30 02:23:41 +02:00
static cmph_io_adapter_t *cmph_io_struct_vector_new(void * vector, cmph_uint32 struct_size, cmph_uint32 key_offset, cmph_uint32 key_len, cmph_uint32 nkeys);
static void cmph_io_struct_vector_destroy(cmph_io_adapter_t * key_source);
2005-01-24 22:25:58 +02:00
static int key_nlfile_read(void *data, char **key, cmph_uint32 *keylen)
{
FILE *fd = (FILE *)data;
*key = NULL;
*keylen = 0;
while(1)
{
char buf[BUFSIZ];
2011-12-26 23:12:24 +02:00
char *c = fgets(buf, BUFSIZ, fd);
2005-01-24 22:25:58 +02:00
if (c == NULL) return -1;
if (feof(fd)) return -1;
*key = (char *)realloc(*key, *keylen + strlen(buf) + 1);
memcpy(*key + *keylen, buf, strlen(buf));
*keylen += (cmph_uint32)strlen(buf);
if (buf[strlen(buf) - 1] != '\n') continue;
break;
}
if ((*keylen) && (*key)[*keylen - 1] == '\n')
{
(*key)[(*keylen) - 1] = 0;
--(*keylen);
}
return (int)(*keylen);
2005-01-24 22:25:58 +02:00
}
static int key_byte_vector_read(void *data, char **key, cmph_uint32 *keylen)
2005-07-26 00:26:17 +03:00
{
cmph_vector_t *cmph_vector = (cmph_vector_t *)data;
cmph_uint8 **keys_vd = (cmph_uint8 **)cmph_vector->vector;
2008-04-12 09:17:21 +03:00
size_t size;
memcpy(keylen, keys_vd[cmph_vector->position], sizeof(*keylen));
2008-04-12 09:17:21 +03:00
size = *keylen;
*key = (char *)malloc(size);
memcpy(*key, keys_vd[cmph_vector->position] + sizeof(*keylen), size);
2005-10-10 20:43:21 +03:00
cmph_vector->position = cmph_vector->position + 1;
return (int)(*keylen);
}
2008-03-30 02:23:41 +02:00
static int key_struct_vector_read(void *data, char **key, cmph_uint32 *keylen)
{
cmph_struct_vector_t *cmph_struct_vector = (cmph_struct_vector_t *)data;
char *keys_vd = (char *)cmph_struct_vector->vector;
2008-04-12 09:17:21 +03:00
size_t size;
2008-03-30 02:23:41 +02:00
*keylen = cmph_struct_vector->key_len;
2008-04-12 09:17:21 +03:00
size = *keylen;
*key = (char *)malloc(size);
memcpy(*key, (keys_vd + (cmph_struct_vector->position * cmph_struct_vector->struct_size) + cmph_struct_vector->key_offset), size);
cmph_struct_vector->position = cmph_struct_vector->position + 1;
return (int)(*keylen);
2008-03-30 02:23:41 +02:00
}
static int key_vector_read(void *data, char **key, cmph_uint32 *keylen)
{
cmph_vector_t *cmph_vector = (cmph_vector_t *)data;
char **keys_vd = (char **)cmph_vector->vector;
2008-04-12 09:17:21 +03:00
size_t size;
*keylen = (cmph_uint32)strlen(keys_vd[cmph_vector->position]);
2008-04-12 09:17:21 +03:00
size = *keylen;
*key = (char *)malloc(size + 1);
strcpy(*key, keys_vd[cmph_vector->position]);
cmph_vector->position = cmph_vector->position + 1;
return (int)(*keylen);
2005-07-26 00:26:17 +03:00
}
2005-01-24 22:25:58 +02:00
static void key_nlfile_dispose(void *data, char *key, cmph_uint32 keylen)
{
free(key);
}
2005-07-26 00:26:17 +03:00
2005-07-29 03:00:01 +03:00
static void key_vector_dispose(void *data, char *key, cmph_uint32 keylen)
{
free(key);
2005-07-29 03:00:01 +03:00
}
2005-01-24 22:25:58 +02:00
static void key_nlfile_rewind(void *data)
{
FILE *fd = (FILE *)data;
rewind(fd);
}
2008-03-30 02:23:41 +02:00
static void key_struct_vector_rewind(void *data)
{
cmph_struct_vector_t *cmph_struct_vector = (cmph_struct_vector_t *)data;
cmph_struct_vector->position = 0;
}
2005-07-26 00:26:17 +03:00
static void key_vector_rewind(void *data)
{
2005-10-10 20:43:21 +03:00
cmph_vector_t *cmph_vector = (cmph_vector_t *)data;
cmph_vector->position = 0;
2005-07-26 00:26:17 +03:00
}
2005-01-24 22:25:58 +02:00
static cmph_uint32 count_nlfile_keys(FILE *fd)
{
cmph_uint32 count = 0;
2009-03-15 01:24:05 +02:00
register char * ptr;
2005-01-24 22:25:58 +02:00
rewind(fd);
while(1)
{
char buf[BUFSIZ];
2011-12-26 23:12:24 +02:00
ptr = fgets(buf, BUFSIZ, fd);
2005-01-24 22:25:58 +02:00
if (feof(fd)) break;
2011-12-26 23:12:24 +02:00
if (ferror(fd) || ptr == NULL) {
perror("Error reading input file");
return 0;
}
2005-01-24 22:25:58 +02:00
if (buf[strlen(buf) - 1] != '\n') continue;
++count;
}
rewind(fd);
return count;
}
cmph_io_adapter_t *cmph_io_nlfile_adapter(FILE * keys_fd)
{
cmph_io_adapter_t * key_source = (cmph_io_adapter_t *)malloc(sizeof(cmph_io_adapter_t));
2005-01-24 22:25:58 +02:00
assert(key_source);
key_source->data = (void *)keys_fd;
key_source->nkeys = count_nlfile_keys(keys_fd);
key_source->read = key_nlfile_read;
key_source->dispose = key_nlfile_dispose;
key_source->rewind = key_nlfile_rewind;
return key_source;
}
2005-10-10 20:43:21 +03:00
void cmph_io_nlfile_adapter_destroy(cmph_io_adapter_t * key_source)
{
free(key_source);
}
2005-01-24 22:25:58 +02:00
cmph_io_adapter_t *cmph_io_nlnkfile_adapter(FILE * keys_fd, cmph_uint32 nkeys)
{
cmph_io_adapter_t * key_source = (cmph_io_adapter_t *)malloc(sizeof(cmph_io_adapter_t));
2005-01-24 22:25:58 +02:00
assert(key_source);
key_source->data = (void *)keys_fd;
key_source->nkeys = nkeys;
key_source->read = key_nlfile_read;
key_source->dispose = key_nlfile_dispose;
key_source->rewind = key_nlfile_rewind;
return key_source;
}
2005-10-10 20:43:21 +03:00
void cmph_io_nlnkfile_adapter_destroy(cmph_io_adapter_t * key_source)
{
free(key_source);
}
2008-03-30 02:23:41 +02:00
static cmph_io_adapter_t *cmph_io_struct_vector_new(void * vector, cmph_uint32 struct_size, cmph_uint32 key_offset, cmph_uint32 key_len, cmph_uint32 nkeys)
{
cmph_io_adapter_t * key_source = (cmph_io_adapter_t *)malloc(sizeof(cmph_io_adapter_t));
cmph_struct_vector_t * cmph_struct_vector = (cmph_struct_vector_t *)malloc(sizeof(cmph_struct_vector_t));
assert(key_source);
assert(cmph_struct_vector);
cmph_struct_vector->vector = vector;
cmph_struct_vector->position = 0;
cmph_struct_vector->struct_size = struct_size;
cmph_struct_vector->key_offset = key_offset;
cmph_struct_vector->key_len = key_len;
key_source->data = (void *)cmph_struct_vector;
key_source->nkeys = nkeys;
return key_source;
}
static void cmph_io_struct_vector_destroy(cmph_io_adapter_t * key_source)
{
cmph_struct_vector_t *cmph_struct_vector = (cmph_struct_vector_t *)key_source->data;
cmph_struct_vector->vector = NULL;
free(cmph_struct_vector);
free(key_source);
}
2005-10-10 20:43:21 +03:00
static cmph_io_adapter_t *cmph_io_vector_new(void * vector, cmph_uint32 nkeys)
{
cmph_io_adapter_t * key_source = (cmph_io_adapter_t *)malloc(sizeof(cmph_io_adapter_t));
cmph_vector_t * cmph_vector = (cmph_vector_t *)malloc(sizeof(cmph_vector_t));
2005-10-10 20:43:21 +03:00
assert(key_source);
assert(cmph_vector);
cmph_vector->vector = vector;
cmph_vector->position = 0;
key_source->data = (void *)cmph_vector;
key_source->nkeys = nkeys;
return key_source;
}
static void cmph_io_vector_destroy(cmph_io_adapter_t * key_source)
{
cmph_vector_t *cmph_vector = (cmph_vector_t *)key_source->data;
cmph_vector->vector = NULL;
free(cmph_vector);
free(key_source);
}
cmph_io_adapter_t *cmph_io_byte_vector_adapter(cmph_uint8 ** vector, cmph_uint32 nkeys)
{
cmph_io_adapter_t * key_source = cmph_io_vector_new(vector, nkeys);
key_source->read = key_byte_vector_read;
key_source->dispose = key_vector_dispose;
key_source->rewind = key_vector_rewind;
return key_source;
}
void cmph_io_byte_vector_adapter_destroy(cmph_io_adapter_t * key_source)
{
cmph_io_vector_destroy(key_source);
}
2008-03-30 02:23:41 +02:00
cmph_io_adapter_t *cmph_io_struct_vector_adapter(void * vector, cmph_uint32 struct_size, cmph_uint32 key_offset, cmph_uint32 key_len, cmph_uint32 nkeys)
{
cmph_io_adapter_t * key_source = cmph_io_struct_vector_new(vector, struct_size, key_offset, key_len, nkeys);
key_source->read = key_struct_vector_read;
key_source->dispose = key_vector_dispose;
key_source->rewind = key_struct_vector_rewind;
return key_source;
2008-03-30 02:23:41 +02:00
}
void cmph_io_struct_vector_adapter_destroy(cmph_io_adapter_t * key_source)
{
cmph_io_struct_vector_destroy(key_source);
2008-03-30 02:23:41 +02:00
}
2005-07-28 00:13:02 +03:00
cmph_io_adapter_t *cmph_io_vector_adapter(char ** vector, cmph_uint32 nkeys)
2005-01-24 22:25:58 +02:00
{
2005-10-10 20:43:21 +03:00
cmph_io_adapter_t * key_source = cmph_io_vector_new(vector, nkeys);
key_source->read = key_vector_read;
key_source->dispose = key_vector_dispose;
key_source->rewind = key_vector_rewind;
return key_source;
}
void cmph_io_vector_adapter_destroy(cmph_io_adapter_t * key_source)
{
cmph_io_vector_destroy(key_source);
2005-01-24 22:25:58 +02:00
}
cmph_config_t *cmph_config_new(cmph_io_adapter_t *key_source)
2004-12-23 15:16:30 +02:00
{
cmph_config_t *mph = NULL;
mph = __config_new(key_source);
2004-12-23 15:16:30 +02:00
assert(mph);
2005-01-25 23:06:58 +02:00
mph->algo = CMPH_CHM; // default value
mph->data = chm_config_new();
2004-12-23 15:16:30 +02:00
return mph;
}
void cmph_config_set_algo(cmph_config_t *mph, CMPH_ALGO algo)
{
if (algo != mph->algo)
{
switch (mph->algo)
{
case CMPH_CHM:
2005-07-29 03:00:01 +03:00
chm_config_destroy(mph);
2005-07-28 00:13:02 +03:00
break;
case CMPH_BMZ:
2005-07-29 03:00:01 +03:00
bmz_config_destroy(mph);
2005-07-28 00:13:02 +03:00
break;
case CMPH_BMZ8:
bmz8_config_destroy(mph);
break;
2005-07-28 00:13:02 +03:00
case CMPH_BRZ:
brz_config_destroy(mph);
2005-07-28 00:13:02 +03:00
break;
2006-08-03 23:00:11 +03:00
case CMPH_FCH:
fch_config_destroy(mph);
break;
2008-03-23 02:46:34 +02:00
case CMPH_BDZ:
bdz_config_destroy(mph);
break;
2008-03-25 22:20:55 +02:00
case CMPH_BDZ_PH:
bdz_ph_config_destroy(mph);
break;
case CMPH_CHD_PH:
chd_ph_config_destroy(mph);
break;
2009-04-08 02:16:40 +03:00
case CMPH_CHD:
chd_config_destroy(mph);
break;
default:
2005-07-28 00:13:02 +03:00
assert(0);
}
switch(algo)
{
case CMPH_CHM:
2005-07-28 00:13:02 +03:00
mph->data = chm_config_new();
break;
case CMPH_BMZ:
2005-07-28 00:13:02 +03:00
mph->data = bmz_config_new();
break;
case CMPH_BMZ8:
2005-09-06 17:11:37 +03:00
mph->data = bmz8_config_new();
break;
2005-07-28 00:13:02 +03:00
case CMPH_BRZ:
mph->data = brz_config_new();
2005-09-06 17:11:37 +03:00
break;
2006-08-03 23:00:11 +03:00
case CMPH_FCH:
mph->data = fch_config_new();
break;
2008-03-23 02:46:34 +02:00
case CMPH_BDZ:
mph->data = bdz_config_new();
break;
2008-03-25 22:20:55 +02:00
case CMPH_BDZ_PH:
mph->data = bdz_ph_config_new();
break;
case CMPH_CHD_PH:
mph->data = chd_ph_config_new();
break;
2009-04-08 02:16:40 +03:00
case CMPH_CHD:
mph->data = chd_config_new(mph);
break;
default:
2005-07-28 00:13:02 +03:00
assert(0);
}
}
mph->algo = algo;
}
void cmph_config_set_tmp_dir(cmph_config_t *mph, cmph_uint8 *tmp_dir)
{
if (mph->algo == CMPH_BRZ)
{
2006-08-03 23:00:11 +03:00
brz_config_set_tmp_dir(mph, tmp_dir);
}
}
void cmph_config_set_mphf_fd(cmph_config_t *mph, FILE *mphf_fd)
{
if (mph->algo == CMPH_BRZ)
{
2006-08-03 23:00:11 +03:00
brz_config_set_mphf_fd(mph, mphf_fd);
}
}
2008-04-12 09:17:21 +03:00
void cmph_config_set_b(cmph_config_t *mph, cmph_uint32 b)
{
if (mph->algo == CMPH_BRZ)
{
2006-08-03 23:00:11 +03:00
brz_config_set_b(mph, b);
}
else if (mph->algo == CMPH_BDZ)
2008-03-23 02:46:34 +02:00
{
bdz_config_set_b(mph, b);
}
else if (mph->algo == CMPH_CHD_PH)
{
chd_ph_config_set_b(mph, b);
}
else if (mph->algo == CMPH_CHD)
2009-04-08 02:16:40 +03:00
{
chd_config_set_b(mph, b);
}
}
void cmph_config_set_keys_per_bin(cmph_config_t *mph, cmph_uint32 keys_per_bin)
{
if (mph->algo == CMPH_CHD_PH)
{
chd_ph_config_set_keys_per_bin(mph, keys_per_bin);
}
else if (mph->algo == CMPH_CHD)
2009-04-08 02:16:40 +03:00
{
chd_config_set_keys_per_bin(mph, keys_per_bin);
}
}
void cmph_config_set_memory_availability(cmph_config_t *mph, cmph_uint32 memory_availability)
{
if (mph->algo == CMPH_BRZ)
{
2006-08-03 23:00:11 +03:00
brz_config_set_memory_availability(mph, memory_availability);
}
}
void cmph_config_destroy(cmph_config_t *mph)
2004-12-23 15:16:30 +02:00
{
2008-03-29 03:48:15 +02:00
if(mph)
2004-12-23 15:16:30 +02:00
{
2008-03-29 03:48:15 +02:00
DEBUGP("Destroying mph with algo %s\n", cmph_names[mph->algo]);
switch (mph->algo)
{
case CMPH_CHM:
chm_config_destroy(mph);
break;
case CMPH_BMZ: /* included -- Fabiano */
bmz_config_destroy(mph);
break;
case CMPH_BMZ8: /* included -- Fabiano */
bmz8_config_destroy(mph);
2008-03-29 03:48:15 +02:00
break;
case CMPH_BRZ: /* included -- Fabiano */
brz_config_destroy(mph);
2008-03-29 03:48:15 +02:00
break;
case CMPH_FCH: /* included -- Fabiano */
fch_config_destroy(mph);
2008-03-29 03:48:15 +02:00
break;
case CMPH_BDZ: /* included -- Fabiano */
bdz_config_destroy(mph);
2008-03-29 03:48:15 +02:00
break;
case CMPH_BDZ_PH: /* included -- Fabiano */
bdz_ph_config_destroy(mph);
break;
case CMPH_CHD_PH: /* included -- Fabiano */
chd_ph_config_destroy(mph);
2008-03-29 03:48:15 +02:00
break;
2009-04-08 02:16:40 +03:00
case CMPH_CHD: /* included -- Fabiano */
chd_config_destroy(mph);
break;
2008-03-29 03:48:15 +02:00
default:
assert(0);
}
__config_destroy(mph);
2004-12-23 15:16:30 +02:00
}
}
void cmph_config_set_verbosity(cmph_config_t *mph, cmph_uint32 verbosity)
2004-12-23 15:16:30 +02:00
{
mph->verbosity = verbosity;
}
void cmph_config_set_hashfuncs(cmph_config_t *mph, CMPH_HASH *hashfuncs)
2004-12-23 15:16:30 +02:00
{
switch (mph->algo)
{
2005-01-25 23:06:58 +02:00
case CMPH_CHM:
chm_config_set_hashfuncs(mph, hashfuncs);
2004-12-23 15:16:30 +02:00
break;
2005-01-18 23:06:08 +02:00
case CMPH_BMZ: /* included -- Fabiano */
bmz_config_set_hashfuncs(mph, hashfuncs);
2004-12-23 15:16:30 +02:00
break;
case CMPH_BMZ8: /* included -- Fabiano */
bmz8_config_set_hashfuncs(mph, hashfuncs);
break;
2005-07-28 00:13:02 +03:00
case CMPH_BRZ: /* included -- Fabiano */
brz_config_set_hashfuncs(mph, hashfuncs);
2005-07-28 00:13:02 +03:00
break;
2006-08-03 23:00:11 +03:00
case CMPH_FCH: /* included -- Fabiano */
fch_config_set_hashfuncs(mph, hashfuncs);
break;
2008-03-23 02:46:34 +02:00
case CMPH_BDZ: /* included -- Fabiano */
bdz_config_set_hashfuncs(mph, hashfuncs);
break;
2008-03-25 22:20:55 +02:00
case CMPH_BDZ_PH: /* included -- Fabiano */
bdz_ph_config_set_hashfuncs(mph, hashfuncs);
break;
case CMPH_CHD_PH: /* included -- Fabiano */
chd_ph_config_set_hashfuncs(mph, hashfuncs);
break;
2009-04-08 02:16:40 +03:00
case CMPH_CHD: /* included -- Fabiano */
chd_config_set_hashfuncs(mph, hashfuncs);
break;
2004-12-23 15:16:30 +02:00
default:
break;
}
return;
}
2008-04-12 09:17:21 +03:00
void cmph_config_set_graphsize(cmph_config_t *mph, double c)
{
mph->c = c;
return;
}
2004-12-23 15:16:30 +02:00
cmph_t *cmph_new(cmph_config_t *mph)
2004-12-23 15:16:30 +02:00
{
cmph_t *mphf = NULL;
2008-04-12 09:17:21 +03:00
double c = mph->c;
DEBUGP("Creating mph with algorithm %s\n", cmph_names[mph->algo]);
switch (mph->algo)
2004-12-23 15:16:30 +02:00
{
2005-01-25 23:06:58 +02:00
case CMPH_CHM:
DEBUGP("Creating chm hash\n");
mphf = chm_new(mph, c);
2004-12-23 15:16:30 +02:00
break;
2005-01-18 23:06:08 +02:00
case CMPH_BMZ: /* included -- Fabiano */
2004-12-23 15:16:30 +02:00
DEBUGP("Creating bmz hash\n");
mphf = bmz_new(mph, c);
2004-12-23 15:16:30 +02:00
break;
case CMPH_BMZ8: /* included -- Fabiano */
DEBUGP("Creating bmz8 hash\n");
mphf = bmz8_new(mph, c);
break;
2005-07-28 00:13:02 +03:00
case CMPH_BRZ: /* included -- Fabiano */
DEBUGP("Creating brz hash\n");
if (c >= 2.0) brz_config_set_algo(mph, CMPH_FCH);
else brz_config_set_algo(mph, CMPH_BMZ8);
mphf = brz_new(mph, c);
2005-07-28 00:13:02 +03:00
break;
2006-08-03 23:00:11 +03:00
case CMPH_FCH: /* included -- Fabiano */
DEBUGP("Creating fch hash\n");
mphf = fch_new(mph, c);
break;
2008-03-23 02:46:34 +02:00
case CMPH_BDZ: /* included -- Fabiano */
DEBUGP("Creating bdz hash\n");
mphf = bdz_new(mph, c);
break;
2008-03-25 22:20:55 +02:00
case CMPH_BDZ_PH: /* included -- Fabiano */
DEBUGP("Creating bdz_ph hash\n");
mphf = bdz_ph_new(mph, c);
break;
case CMPH_CHD_PH: /* included -- Fabiano */
DEBUGP("Creating chd_ph hash\n");
mphf = chd_ph_new(mph, c);
break;
2009-04-08 02:16:40 +03:00
case CMPH_CHD: /* included -- Fabiano */
DEBUGP("Creating chd hash\n");
mphf = chd_new(mph, c);
break;
2004-12-23 15:16:30 +02:00
default:
assert(0);
}
return mphf;
}
int cmph_dump(cmph_t *mphf, FILE *f)
2004-12-23 15:16:30 +02:00
{
switch (mphf->algo)
{
2005-01-25 23:06:58 +02:00
case CMPH_CHM:
return chm_dump(mphf, f);
2005-01-18 23:06:08 +02:00
case CMPH_BMZ: /* included -- Fabiano */
return bmz_dump(mphf, f);
case CMPH_BMZ8: /* included -- Fabiano */
return bmz8_dump(mphf, f);
2005-07-28 00:13:02 +03:00
case CMPH_BRZ: /* included -- Fabiano */
return brz_dump(mphf, f);
2006-08-03 23:00:11 +03:00
case CMPH_FCH: /* included -- Fabiano */
return fch_dump(mphf, f);
2008-03-23 02:46:34 +02:00
case CMPH_BDZ: /* included -- Fabiano */
return bdz_dump(mphf, f);
2008-03-25 22:20:55 +02:00
case CMPH_BDZ_PH: /* included -- Fabiano */
return bdz_ph_dump(mphf, f);
case CMPH_CHD_PH: /* included -- Fabiano */
return chd_ph_dump(mphf, f);
2009-04-08 02:16:40 +03:00
case CMPH_CHD: /* included -- Fabiano */
return chd_dump(mphf, f);
2004-12-23 15:16:30 +02:00
default:
assert(0);
}
assert(0);
return 0;
}
cmph_t *cmph_load(FILE *f)
2004-12-23 15:16:30 +02:00
{
cmph_t *mphf = NULL;
2004-12-23 15:16:30 +02:00
DEBUGP("Loading mphf generic parts\n");
mphf = __cmph_load(f);
2004-12-23 15:16:30 +02:00
if (mphf == NULL) return NULL;
DEBUGP("Loading mphf algorithm dependent parts\n");
switch (mphf->algo)
{
2005-01-25 23:06:58 +02:00
case CMPH_CHM:
chm_load(f, mphf);
2004-12-23 15:16:30 +02:00
break;
2005-01-18 23:06:08 +02:00
case CMPH_BMZ: /* included -- Fabiano */
DEBUGP("Loading bmz algorithm dependent parts\n");
bmz_load(f, mphf);
2004-12-23 15:16:30 +02:00
break;
case CMPH_BMZ8: /* included -- Fabiano */
DEBUGP("Loading bmz8 algorithm dependent parts\n");
bmz8_load(f, mphf);
break;
2005-07-28 00:13:02 +03:00
case CMPH_BRZ: /* included -- Fabiano */
DEBUGP("Loading brz algorithm dependent parts\n");
brz_load(f, mphf);
2005-07-28 00:13:02 +03:00
break;
2006-08-03 23:00:11 +03:00
case CMPH_FCH: /* included -- Fabiano */
DEBUGP("Loading fch algorithm dependent parts\n");
fch_load(f, mphf);
break;
2008-03-23 02:46:34 +02:00
case CMPH_BDZ: /* included -- Fabiano */
DEBUGP("Loading bdz algorithm dependent parts\n");
bdz_load(f, mphf);
break;
2008-03-25 22:20:55 +02:00
case CMPH_BDZ_PH: /* included -- Fabiano */
DEBUGP("Loading bdz_ph algorithm dependent parts\n");
bdz_ph_load(f, mphf);
break;
case CMPH_CHD_PH: /* included -- Fabiano */
DEBUGP("Loading chd_ph algorithm dependent parts\n");
chd_ph_load(f, mphf);
break;
2009-04-08 02:16:40 +03:00
case CMPH_CHD: /* included -- Fabiano */
DEBUGP("Loading chd algorithm dependent parts\n");
chd_load(f, mphf);
break;
2004-12-23 15:16:30 +02:00
default:
assert(0);
}
DEBUGP("Loaded mphf\n");
return mphf;
}
cmph_uint32 cmph_search(cmph_t *mphf, const char *key, cmph_uint32 keylen)
2004-12-23 15:16:30 +02:00
{
2008-03-26 22:26:48 +02:00
DEBUGP("mphf algorithm: %u \n", mphf->algo);
2004-12-23 15:16:30 +02:00
switch(mphf->algo)
{
2005-01-25 23:06:58 +02:00
case CMPH_CHM:
return chm_search(mphf, key, keylen);
2005-01-18 23:06:08 +02:00
case CMPH_BMZ: /* included -- Fabiano */
DEBUGP("bmz algorithm search\n");
return bmz_search(mphf, key, keylen);
case CMPH_BMZ8: /* included -- Fabiano */
DEBUGP("bmz8 algorithm search\n");
return bmz8_search(mphf, key, keylen);
2005-07-28 00:13:02 +03:00
case CMPH_BRZ: /* included -- Fabiano */
DEBUGP("brz algorithm search\n");
return brz_search(mphf, key, keylen);
2006-08-03 23:00:11 +03:00
case CMPH_FCH: /* included -- Fabiano */
DEBUGP("fch algorithm search\n");
2006-08-03 23:00:11 +03:00
return fch_search(mphf, key, keylen);
2008-03-23 02:46:34 +02:00
case CMPH_BDZ: /* included -- Fabiano */
DEBUGP("bdz algorithm search\n");
2008-03-23 02:46:34 +02:00
return bdz_search(mphf, key, keylen);
2008-03-25 22:20:55 +02:00
case CMPH_BDZ_PH: /* included -- Fabiano */
DEBUGP("bdz_ph algorithm search\n");
2008-03-25 22:20:55 +02:00
return bdz_ph_search(mphf, key, keylen);
case CMPH_CHD_PH: /* included -- Fabiano */
DEBUGP("chd_ph algorithm search\n");
return chd_ph_search(mphf, key, keylen);
2009-04-08 02:16:40 +03:00
case CMPH_CHD: /* included -- Fabiano */
DEBUGP("chd algorithm search\n");
2009-04-08 02:16:40 +03:00
return chd_search(mphf, key, keylen);
2004-12-23 15:16:30 +02:00
default:
assert(0);
}
assert(0);
return 0;
2004-12-23 15:16:30 +02:00
}
cmph_uint32 cmph_size(cmph_t *mphf)
2004-12-23 15:16:30 +02:00
{
return mphf->size;
}
void cmph_destroy(cmph_t *mphf)
2004-12-23 15:16:30 +02:00
{
switch(mphf->algo)
{
2005-01-25 23:06:58 +02:00
case CMPH_CHM:
chm_destroy(mphf);
2004-12-23 15:16:30 +02:00
return;
2005-01-18 23:06:08 +02:00
case CMPH_BMZ: /* included -- Fabiano */
bmz_destroy(mphf);
2004-12-23 15:16:30 +02:00
return;
case CMPH_BMZ8: /* included -- Fabiano */
bmz8_destroy(mphf);
return;
2005-07-28 00:13:02 +03:00
case CMPH_BRZ: /* included -- Fabiano */
brz_destroy(mphf);
2005-07-28 00:13:02 +03:00
return;
2006-08-03 23:00:11 +03:00
case CMPH_FCH: /* included -- Fabiano */
fch_destroy(mphf);
2006-08-03 23:00:11 +03:00
return;
2008-03-23 02:46:34 +02:00
case CMPH_BDZ: /* included -- Fabiano */
bdz_destroy(mphf);
2008-03-25 22:20:55 +02:00
return;
case CMPH_BDZ_PH: /* included -- Fabiano */
bdz_ph_destroy(mphf);
return;
case CMPH_CHD_PH: /* included -- Fabiano */
chd_ph_destroy(mphf);
2008-03-23 02:46:34 +02:00
return;
2009-04-08 02:16:40 +03:00
case CMPH_CHD: /* included -- Fabiano */
chd_destroy(mphf);
return;
default:
2004-12-23 15:16:30 +02:00
assert(0);
}
assert(0);
return;
}
2008-03-26 22:26:48 +02:00
/** \fn void cmph_pack(cmph_t *mphf, void *packed_mphf);
* \brief Support the ability to pack a perfect hash function into a preallocated contiguous memory space pointed by packed_mphf.
* \param mphf pointer to the resulting mphf
* \param packed_mphf pointer to the contiguous memory area used to store the resulting mphf. The size of packed_mphf must be at least cmph_packed_size()
2008-03-26 22:26:48 +02:00
*/
void cmph_pack(cmph_t *mphf, void *packed_mphf)
{
// packing algorithm type to be used in cmph.c
cmph_uint32 * ptr = (cmph_uint32 *) packed_mphf;
2008-03-26 22:26:48 +02:00
*ptr++ = mphf->algo;
DEBUGP("mphf->algo = %u\n", mphf->algo);
switch(mphf->algo)
{
case CMPH_CHM:
chm_pack(mphf, ptr);
break;
case CMPH_BMZ: /* included -- Fabiano */
bmz_pack(mphf, ptr);
break;
case CMPH_BMZ8: /* included -- Fabiano */
bmz8_pack(mphf, ptr);
break;
case CMPH_BRZ: /* included -- Fabiano */
brz_pack(mphf, ptr);
break;
case CMPH_FCH: /* included -- Fabiano */
fch_pack(mphf, ptr);
break;
case CMPH_BDZ: /* included -- Fabiano */
bdz_pack(mphf, ptr);
break;
case CMPH_BDZ_PH: /* included -- Fabiano */
bdz_ph_pack(mphf, ptr);
break;
case CMPH_CHD_PH: /* included -- Fabiano */
chd_ph_pack(mphf, ptr);
break;
2009-04-08 02:16:40 +03:00
case CMPH_CHD: /* included -- Fabiano */
chd_pack(mphf, ptr);
break;
default:
2008-03-26 22:26:48 +02:00
assert(0);
}
return;
}
/** \fn cmph_uint32 cmph_packed_size(cmph_t *mphf);
* \brief Return the amount of space needed to pack mphf.
* \param mphf pointer to a mphf
* \return the size of the packed function or zero for failures
*/
2008-03-26 22:26:48 +02:00
cmph_uint32 cmph_packed_size(cmph_t *mphf)
{
switch(mphf->algo)
{
case CMPH_CHM:
return chm_packed_size(mphf);
case CMPH_BMZ: /* included -- Fabiano */
return bmz_packed_size(mphf);
case CMPH_BMZ8: /* included -- Fabiano */
return bmz8_packed_size(mphf);
case CMPH_BRZ: /* included -- Fabiano */
return brz_packed_size(mphf);
case CMPH_FCH: /* included -- Fabiano */
return fch_packed_size(mphf);
case CMPH_BDZ: /* included -- Fabiano */
return bdz_packed_size(mphf);
case CMPH_BDZ_PH: /* included -- Fabiano */
return bdz_ph_packed_size(mphf);
case CMPH_CHD_PH: /* included -- Fabiano */
return chd_ph_packed_size(mphf);
2009-04-08 02:16:40 +03:00
case CMPH_CHD: /* included -- Fabiano */
return chd_packed_size(mphf);
default:
2008-03-26 22:26:48 +02:00
assert(0);
}
return 0; // FAILURE
}
/** cmph_uint32 cmph_search(void *packed_mphf, const char *key, cmph_uint32 keylen);
* \brief Use the packed mphf to do a search.
2008-03-26 22:26:48 +02:00
* \param packed_mphf pointer to the packed mphf
* \param key key to be hashed
* \param keylen key legth in bytes
* \return The mphf value
*/
cmph_uint32 cmph_search_packed(void *packed_mphf, const char *key, cmph_uint32 keylen)
{
cmph_uint32 *ptr = (cmph_uint32 *)packed_mphf;
// fprintf(stderr, "algo:%u\n", *ptr);
switch(*ptr)
{
case CMPH_CHM:
return chm_search_packed(++ptr, key, keylen);
case CMPH_BMZ: /* included -- Fabiano */
return bmz_search_packed(++ptr, key, keylen);
case CMPH_BMZ8: /* included -- Fabiano */
return bmz8_search_packed(++ptr, key, keylen);
case CMPH_BRZ: /* included -- Fabiano */
return brz_search_packed(++ptr, key, keylen);
case CMPH_FCH: /* included -- Fabiano */
return fch_search_packed(++ptr, key, keylen);
case CMPH_BDZ: /* included -- Fabiano */
return bdz_search_packed(++ptr, key, keylen);
case CMPH_BDZ_PH: /* included -- Fabiano */
return bdz_ph_search_packed(++ptr, key, keylen);
case CMPH_CHD_PH: /* included -- Fabiano */
return chd_ph_search_packed(++ptr, key, keylen);
2009-04-08 02:16:40 +03:00
case CMPH_CHD: /* included -- Fabiano */
return chd_search_packed(++ptr, key, keylen);
default:
2008-03-26 22:26:48 +02:00
assert(0);
}
return 0; // FAILURE
}