|
|
|
/*
|
|
|
|
* upb - a minimalist implementation of protocol buffers.
|
|
|
|
*
|
|
|
|
* Copyright (c) 2009 Google Inc. See LICENSE for details.
|
|
|
|
* Author: Josh Haberman <jhaberman@gmail.com>
|
|
|
|
*
|
|
|
|
* This file defines very fast int->struct (inttable) and string->struct
|
|
|
|
* (strtable) hash tables. The struct can be of any size, and it is stored
|
|
|
|
* in the table itself, for cache-friendly performance.
|
|
|
|
*
|
|
|
|
* The table uses internal chaining with Brent's variation (inspired by the
|
|
|
|
* Lua implementation of hash tables). The hash function for strings is
|
|
|
|
* Austin Appleby's "MurmurHash."
|
|
|
|
*
|
|
|
|
* This header is internal to upb; its interface should not be considered
|
|
|
|
* public or stable.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#ifndef UPB_TABLE_H_
|
|
|
|
#define UPB_TABLE_H_
|
|
|
|
|
|
|
|
#include <assert.h>
|
|
|
|
#include <stddef.h>
|
|
|
|
#include "upb.h"
|
|
|
|
|
|
|
|
#ifdef __cplusplus
|
|
|
|
extern "C" {
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#define UPB_END_OF_CHAIN (uint32_t)-1
|
|
|
|
|
|
|
|
typedef struct {
|
|
|
|
bool has_entry:1;
|
|
|
|
// The rest of the bits are the user's.
|
|
|
|
} upb_inttable_value;
|
|
|
|
|
|
|
|
typedef struct {
|
|
|
|
uint32_t key;
|
|
|
|
uint32_t next; // Internal chaining.
|
|
|
|
} upb_inttable_header;
|
|
|
|
|
|
|
|
typedef struct {
|
|
|
|
upb_inttable_header hdr;
|
|
|
|
upb_inttable_value val;
|
|
|
|
} upb_inttable_entry;
|
|
|
|
|
|
|
|
// TODO: consider storing the hash in the entry. This would avoid the need to
|
|
|
|
// rehash on table resizes, but more importantly could possibly improve lookup
|
|
|
|
// performance by letting us compare hashes before comparing lengths or the
|
|
|
|
// strings themselves.
|
|
|
|
typedef struct {
|
|
|
|
char *key; // We own, nullz. TODO: store explicit len?
|
|
|
|
uint32_t next; // Internal chaining.
|
|
|
|
} upb_strtable_header;
|
|
|
|
|
|
|
|
typedef struct {
|
|
|
|
upb_strtable_header hdr;
|
|
|
|
uint32_t val; // Val is at least 32 bits.
|
|
|
|
} upb_strtable_entry;
|
|
|
|
|
|
|
|
typedef struct {
|
|
|
|
void *entries; // Hash table.
|
|
|
|
uint32_t count; // Number of entries in the hash part.
|
|
|
|
uint32_t mask; // Mask to turn hash value -> bucket.
|
|
|
|
uint16_t entry_size; // Size of each entry.
|
|
|
|
uint16_t value_size; // Size of each value.
|
|
|
|
uint8_t size_lg2; // Size of the hash table part is 2^size_lg2 entries.
|
|
|
|
} upb_table;
|
|
|
|
|
|
|
|
typedef struct {
|
|
|
|
upb_table t;
|
|
|
|
} upb_strtable;
|
|
|
|
|
|
|
|
typedef struct {
|
|
|
|
upb_table t;
|
|
|
|
void *array; // Array part of the table.
|
|
|
|
uint32_t array_size; // Array part size.
|
|
|
|
uint32_t array_count; // Array part number of elements.
|
|
|
|
} upb_inttable;
|
|
|
|
|
|
|
|
// Initialize and free a table, respectively. Specify the initial size
|
|
|
|
// with 'size' (the size will be increased as necessary). Value size
|
|
|
|
// specifies how many bytes each value in the table is.
|
|
|
|
//
|
|
|
|
// WARNING! The lowest bit of every entry is reserved by the hash table.
|
|
|
|
// It will always be overwritten when you insert, and must not be modified
|
|
|
|
// when looked up!
|
|
|
|
void upb_inttable_init(upb_inttable *table, uint32_t size, uint16_t value_size);
|
|
|
|
void upb_inttable_free(upb_inttable *table);
|
|
|
|
void upb_strtable_init(upb_strtable *table, uint32_t size, uint16_t value_size);
|
|
|
|
void upb_strtable_free(upb_strtable *table);
|
|
|
|
|
|
|
|
// Number of values in the hash table.
|
|
|
|
INLINE uint32_t upb_table_count(const upb_table *t) { return t->count; }
|
|
|
|
INLINE uint32_t upb_inttable_count(const upb_inttable *t) {
|
|
|
|
return t->array_count + upb_table_count(&t->t);
|
|
|
|
}
|
|
|
|
INLINE uint32_t upb_strtable_count(const upb_strtable *t) {
|
|
|
|
return upb_table_count(&t->t);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Inserts the given key into the hashtable with the given value. The key must
|
|
|
|
// not already exist in the hash table. The data will be copied from val into
|
|
|
|
// the hashtable (the amount of data copied comes from value_size when the
|
|
|
|
// table was constructed). Therefore the data at val may be freed once the
|
|
|
|
// call returns. For string tables, the table takes ownership of the string.
|
|
|
|
//
|
|
|
|
// WARNING: the lowest bit of val is reserved and will be overwritten!
|
|
|
|
void upb_inttable_insert(upb_inttable *t, uint32_t key, const void *val);
|
|
|
|
// TODO: may want to allow for more complex keys with custom hash/comparison
|
|
|
|
// functions.
|
|
|
|
void upb_strtable_insert(upb_strtable *t, const char *key, const void *val);
|
|
|
|
void upb_inttable_compact(upb_inttable *t);
|
|
|
|
|
|
|
|
INLINE uint32_t _upb_inttable_bucket(const upb_inttable *t, uint32_t k) {
|
|
|
|
uint32_t bucket = k & t->t.mask; // Identity hash for ints.
|
|
|
|
assert(bucket != UPB_END_OF_CHAIN);
|
|
|
|
return bucket;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Returns true if this key belongs in the array part of the table.
|
|
|
|
INLINE bool _upb_inttable_isarrkey(const upb_inttable *t, uint32_t k) {
|
|
|
|
return (k < t->array_size);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Looks up key in this table, returning a pointer to the user's inserted data.
|
|
|
|
// We have the caller specify the entry_size because fixing this as a literal
|
|
|
|
// (instead of reading table->entry_size) gives the compiler more ability to
|
|
|
|
// optimize.
|
|
|
|
//
|
|
|
|
// Note: All returned pointers are invalidated by inserts!
|
|
|
|
INLINE void *_upb_inttable_fastlookup(const upb_inttable *t, uint32_t key,
|
|
|
|
size_t entry_size, size_t value_size) {
|
|
|
|
upb_inttable_value *arrval =
|
|
|
|
(upb_inttable_value*)UPB_INDEX(t->array, key, value_size);
|
|
|
|
if (_upb_inttable_isarrkey(t, key)) {
|
|
|
|
return (arrval->has_entry) ? arrval : NULL;
|
|
|
|
}
|
|
|
|
uint32_t bucket = _upb_inttable_bucket(t, key);
|
|
|
|
upb_inttable_entry *e =
|
|
|
|
(upb_inttable_entry*)UPB_INDEX(t->t.entries, bucket, entry_size);
|
|
|
|
while (1) {
|
|
|
|
if (e->hdr.key == key) {
|
|
|
|
return &e->val;
|
|
|
|
}
|
|
|
|
if ((bucket = e->hdr.next) == UPB_END_OF_CHAIN) return NULL;
|
|
|
|
e = (upb_inttable_entry*)UPB_INDEX(t->t.entries, bucket, entry_size);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
INLINE size_t _upb_inttable_entrysize(size_t value_size) {
|
|
|
|
return upb_align_up(sizeof(upb_inttable_header) + value_size, 8);
|
|
|
|
}
|
|
|
|
|
|
|
|
INLINE void *upb_inttable_fastlookup(const upb_inttable *t, uint32_t key,
|
|
|
|
uint32_t value_size) {
|
|
|
|
return _upb_inttable_fastlookup(
|
|
|
|
t, key, _upb_inttable_entrysize(value_size), value_size);
|
|
|
|
}
|
|
|
|
|
|
|
|
INLINE void *upb_inttable_lookup(upb_inttable *t, uint32_t key) {
|
|
|
|
return _upb_inttable_fastlookup(t, key, t->t.entry_size, t->t.value_size);
|
|
|
|
}
|
|
|
|
|
|
|
|
void *upb_strtable_lookupl(const upb_strtable *t, const char *key, size_t len);
|
|
|
|
void *upb_strtable_lookup(const upb_strtable *t, const char *key);
|
|
|
|
|
|
|
|
|
|
|
|
/* upb_strtable_iter **********************************************************/
|
|
|
|
|
|
|
|
// Strtable iteration. Order is undefined. Insertions invalidate iterators.
|
|
|
|
// upb_strtable_iter i;
|
|
|
|
// for(upb_strtable_begin(&i, t); !upb_strtable_done(&i); upb_strtable_next(&i)) {
|
|
|
|
// const char *key = upb_strtable_iter_key(&i);
|
|
|
|
// const myval *val = upb_strtable_iter_value(&i);
|
|
|
|
// // ...
|
|
|
|
// }
|
|
|
|
typedef struct {
|
|
|
|
const upb_strtable *t;
|
|
|
|
upb_strtable_entry *e;
|
|
|
|
} upb_strtable_iter;
|
|
|
|
|
|
|
|
void upb_strtable_begin(upb_strtable_iter *i, const upb_strtable *t);
|
|
|
|
void upb_strtable_next(upb_strtable_iter *i);
|
|
|
|
INLINE bool upb_strtable_done(upb_strtable_iter *i) { return i->e == NULL; }
|
|
|
|
INLINE const char *upb_strtable_iter_key(upb_strtable_iter *i) {
|
|
|
|
return i->e->hdr.key;
|
|
|
|
}
|
|
|
|
INLINE const void *upb_strtable_iter_value(upb_strtable_iter *i) {
|
|
|
|
return &i->e->val;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/* upb_inttable_iter **********************************************************/
|
|
|
|
|
|
|
|
// Inttable iteration. Order is undefined. Insertions invalidate iterators.
|
|
|
|
// for(upb_inttable_iter i = upb_inttable_begin(t); !upb_inttable_done(i);
|
|
|
|
// i = upb_inttable_next(t, i)) {
|
|
|
|
// // ...
|
|
|
|
// }
|
|
|
|
typedef struct {
|
|
|
|
uint32_t key;
|
|
|
|
upb_inttable_value *value;
|
|
|
|
bool array_part;
|
|
|
|
} upb_inttable_iter;
|
|
|
|
|
|
|
|
upb_inttable_iter upb_inttable_begin(const upb_inttable *t);
|
|
|
|
upb_inttable_iter upb_inttable_next(const upb_inttable *t,
|
|
|
|
upb_inttable_iter iter);
|
|
|
|
INLINE bool upb_inttable_done(upb_inttable_iter iter) {
|
|
|
|
return iter.value == NULL;
|
|
|
|
}
|
|
|
|
INLINE uint32_t upb_inttable_iter_key(upb_inttable_iter iter) {
|
|
|
|
return iter.key;
|
|
|
|
}
|
|
|
|
INLINE void *upb_inttable_iter_value(upb_inttable_iter iter) {
|
|
|
|
return iter.value;
|
|
|
|
}
|
|
|
|
|
|
|
|
#ifdef __cplusplus
|
|
|
|
} /* extern "C" */
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#endif /* UPB_TABLE_H_ */
|