Add a new hash datatype to do speedy lookups of read only uniform data, like md5's.

remotes/origin/master
Victor Julien 13 years ago
parent 1bb0199dd7
commit 8cfc23ee22

@ -198,6 +198,7 @@ util-unittest-helper.c util-unittest-helper.h \
util-hash.c util-hash.h \
util-hashlist.c util-hashlist.h \
util-hash-lookup3.c util-hash-lookup3.h \
util-rohash.c util-rohash.h \
util-bloomfilter.c util-bloomfilter.h \
util-bloomfilter-counting.c util-bloomfilter-counting.h \
util-pool.c util-pool.h \

@ -37,6 +37,9 @@ on 1 byte), but shoehorning those bytes into integers efficiently is messy.
#ifndef __UTIL_HASH_LOOKUP3_H__
#define __UTIL_HASH_LOOKUP3_H__
#define hashsize(n) ((uint32_t)1<<(n))
#define hashmask(n) (hashsize(n)-1)
uint32_t hashword(const uint32_t *k, /* the key, an array of uint32_t values */
size_t length, /* the length of the key, in uint32_ts */
uint32_t initval); /* the previous hash, or an arbitrary value */

@ -0,0 +1,238 @@
/* Copyright (C) 2007-2012 Open Information Security Foundation
*
* You can copy, redistribute or modify this Program under the terms of
* the GNU General Public License version 2 as published by the Free
* Software Foundation.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* version 2 along with this program; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
* 02110-1301, USA.
*/
/**
* \file
*
* \author Victor Julien <victor@inliniac.net>
*
* Chained read only hash table implementation, meaning that
* after the initial fill no changes are allowed.
*
* Loading takes 2 stages.
* - stage1 maps data
* - stage2 fills blob
*
* \todo a bloomfilter in the ROHashTableOffsets could possibly prevent
* a lot of cache misses when validating a potential match
*
* \todo maybe add a user ctx to be returned instead, something like a
* 4/8 byte ptr or simply a flag
*/
#include "suricata-common.h"
#include "util-hash.h"
#include "util-unittest.h"
#include "util-memcmp.h"
#include "util-hash-lookup3.h"
#include "queue.h"
#include "util-rohash.h"
/** item_size data beyond this header */
typedef struct ROHashTableItem_ {
uint32_t pos; /**< position relative to other values with same hash */
TAILQ_ENTRY(ROHashTableItem_) next;
} ROHashTableItem;
/** offset table */
typedef struct ROHashTableOffsets_ {
uint32_t cnt; /**< number of items for this hash */
uint32_t offset; /**< position in the blob of the first item */
} ROHashTableOffsets;
/** \brief initialize a new rohash
*
* \param hash_bits hash size as 2^hash_bits, so power of 2
* \param item_size size of the data to store
*
* \retval table ptr or NULL on error
*/
ROHashTable *ROHashInit(uint8_t hash_bits, uint16_t item_size) {
if (item_size % 4 != 0 || item_size == 0) {
SCLogError(SC_ERR_HASH_TABLE_INIT, "data size must be multiple of 4");
return NULL;
}
if (hash_bits < 4 || hash_bits > 32) {
SCLogError(SC_ERR_HASH_TABLE_INIT, "invalid hash_bits setting, valid range is 4-32");
return NULL;
}
uint32_t size = hashsize(hash_bits) * sizeof(ROHashTableOffsets);
ROHashTable *table = SCMalloc(sizeof(ROHashTable) + size);
if (table == NULL) {
SCLogError(SC_ERR_HASH_TABLE_INIT, "failed to alloc memory");
return NULL;
}
memset(table, 0, sizeof(ROHashTable) + size);
table->items = 0;
table->item_size = item_size;
table->hash_bits = hash_bits;
TAILQ_INIT(&table->head);
return table;
}
void ROHashFree(ROHashTable *table) {
if (table != NULL) {
if (table->data != NULL) {
SCFree(table->data);
}
SCFree(table);
}
}
/**
* \retval NULL not found
* \retval ptr found
*/
void *ROHashLookup(ROHashTable *table, void *data, uint16_t size) {
if (data == NULL || size != table->item_size) {
SCReturnPtr(NULL, "void");
}
uint32_t hash = hashword(data, table->item_size/4, 0) & hashmask(table->hash_bits);
/* get offsets start */
ROHashTableOffsets *os = (void *)table + sizeof(ROHashTable);
ROHashTableOffsets *o = &os[hash];
/* no matches */
if (o->cnt == 0) {
SCReturnPtr(NULL, "void");
}
uint32_t u;
for (u = 0; u < o->cnt; u++) {
uint32_t offset = (o->offset + u) * table->item_size;
if (SCMemcmp(table->data + offset, data, table->item_size) == 0) {
SCReturnPtr(table->data + offset, "void");
}
}
SCReturnPtr(NULL, "void");
}
/** \brief Add a new value to the hash
*
* \note can only be done when table isn't in a locked state yet
*
* \param table the hash table
* \param value value to add
* \param size value size. *MUST* match table item_size
*
* \retval 0 error
* \retval 1 ok
*/
int ROHashInitQueueValue(ROHashTable *table, void *value, uint16_t size) {
if (table->locked) {
SCLogError(SC_ERR_HASH_TABLE_INIT, "can't add value to locked table");
return 0;
}
if (table->item_size != size) {
SCLogError(SC_ERR_HASH_TABLE_INIT, "wrong size for data %u != %u", size, table->item_size);
return 0;
}
ROHashTableItem *item = SCMalloc(sizeof(ROHashTableItem) + table->item_size);
if (item != NULL) {
memset(item, 0x00, sizeof(ROHashTableItem));
memcpy((void *)item + sizeof(ROHashTableItem), value, table->item_size);
TAILQ_INSERT_TAIL(&table->head, item, next);
return 1;
}
return 0;
}
/** \brief create final hash data structure
*
* \param table the hash table
*
* \retval 0 error
* \retval 1 ok
*
* \note after this call the nothing can be added to the hash anymore.
*/
int ROHashInitFinalize(ROHashTable *table) {
if (table->locked) {
SCLogError(SC_ERR_HASH_TABLE_INIT, "table already locked");
return 0;
}
ROHashTableItem *item = NULL;
ROHashTableOffsets *os = (void *)table + sizeof(ROHashTable);
/* count items per hash value */
TAILQ_FOREACH(item, &table->head, next) {
uint32_t hash = hashword((void *)item + sizeof(*item), table->item_size/4, 0) & hashmask(table->hash_bits);
ROHashTableOffsets *o = &os[hash];
item->pos = o->cnt;
o->cnt++;
table->items++;
}
if (table->items == 0) {
SCLogError(SC_ERR_HASH_TABLE_INIT, "no items");
return 0;
}
/* get the data block */
uint32_t newsize = table->items * table->item_size;
table->data = SCMalloc(newsize);
if (table->data == NULL) {
SCLogError(SC_ERR_HASH_TABLE_INIT, "failed to alloc memory");
return 0;
}
memset(table->data, 0x00, newsize);
/* calc offsets into the block per hash value */
uint32_t total = 0;
uint32_t x;
for (x = 0; x < hashsize(table->hash_bits); x++) {
ROHashTableOffsets *o = &os[x];
if (o->cnt == 0)
continue;
o->offset = total;
total += o->cnt;
}
/* copy each value into the data block */
TAILQ_FOREACH(item, &table->head, next) {
uint32_t hash = hashword((void *)item + sizeof(*item), table->item_size/4, 0) & hashmask(table->hash_bits);
ROHashTableOffsets *o = &os[hash];
uint32_t offset = (o->offset + item->pos) * table->item_size;
memcpy(table->data + offset, (void *)item + sizeof(*item), table->item_size);
}
/* clean up temp items */
while ((item = TAILQ_FIRST(&table->head))) {
TAILQ_REMOVE(&table->head, item, next);
SCFree(item);
}
table->locked = 1;
return 1;
}

@ -0,0 +1,45 @@
/* Copyright (C) 2007-2012 Open Information Security Foundation
*
* You can copy, redistribute or modify this Program under the terms of
* the GNU General Public License version 2 as published by the Free
* Software Foundation.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* version 2 along with this program; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
* 02110-1301, USA.
*/
/**
* \file
*
* \author Victor Julien <victor@inliniac.net>
*/
#ifndef __UTIL_ROHASH_H__
#define __UTIL_ROHASH_H__
typedef struct ROHashTable_ {
uint8_t locked;
uint8_t hash_bits;
uint16_t item_size;
uint32_t items;
void *data;
TAILQ_HEAD(, ROHashTableItem_) head;
} ROHashTable;
/* init time */
ROHashTable *ROHashInit(uint8_t hash_bits, uint16_t item_size);
int ROHashInitFinalize(ROHashTable *table);
void ROHashFree(ROHashTable *table);
int ROHashInitQueueValue(ROHashTable *table, void *value, uint16_t size);
/* run time */
void *ROHashLookup(ROHashTable *table, void *data, uint16_t size);
#endif /* __UTIL_ROHASH_H__ */
Loading…
Cancel
Save