|
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407 |
- /*
- * Copyright (c) 2009-2021, Google LLC
- * All rights reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions are met:
- * * Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- * * Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in the
- * documentation and/or other materials provided with the distribution.
- * * Neither the name of Google LLC nor the
- * names of its contributors may be used to endorse or promote products
- * derived from this software without specific prior written permission.
- *
- * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
- * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
- * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
- * ARE DISCLAIMED. IN NO EVENT SHALL Google LLC BE LIABLE FOR ANY DIRECT,
- * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
- * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
- * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
- * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
- * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- */
-
- /*
- * upb_table
- *
- * This header is INTERNAL-ONLY! Its interfaces are not public or stable!
- * This file defines very fast int->upb_value (inttable) and string->upb_value
- * (strtable) hash tables.
- *
- * The table uses chained scatter with Brent's variation (inspired by the Lua
- * implementation of hash tables). The hash function for strings is Austin
- * Appleby's "MurmurHash."
- *
- * The inttable uses uintptr_t as its key, which guarantees it can be used to
- * store pointers or integers of at least 32 bits (upb isn't really useful on
- * systems where sizeof(void*) < 4).
- *
- * The table must be homogeneous (all values of the same type). In debug
- * mode, we check this on insert and lookup.
- */
-
- #ifndef UPB_INTERNAL_TABLE_H_
- #define UPB_INTERNAL_TABLE_H_
-
- #include <stdint.h>
- #include <string.h>
-
- #include "upb/upb.h"
-
- // Must be last.
- #include "upb/port_def.inc"
-
- #ifdef __cplusplus
- extern "C"
- {
- #endif
-
- /* upb_value ******************************************************************/
-
- typedef struct
- {
- uint64_t val;
- } upb_value;
-
- /* Variant that works with a length-delimited rather than NULL-delimited string,
- * as supported by strtable. */
- char* upb_strdup2(const char* s, size_t len, upb_Arena* a);
-
- UPB_INLINE void _upb_value_setval(upb_value* v, uint64_t val)
- {
- v->val = val;
- }
-
- /* For each value ctype, define the following set of functions:
- *
- * // Get/set an int32 from a upb_value.
- * int32_t upb_value_getint32(upb_value val);
- * void upb_value_setint32(upb_value *val, int32_t cval);
- *
- * // Construct a new upb_value from an int32.
- * upb_value upb_value_int32(int32_t val); */
- #define FUNCS(name, membername, type_t, converter, proto_type) \
- UPB_INLINE void upb_value_set##name(upb_value* val, type_t cval) \
- { \
- val->val = (converter)cval; \
- } \
- UPB_INLINE upb_value upb_value_##name(type_t val) \
- { \
- upb_value ret; \
- upb_value_set##name(&ret, val); \
- return ret; \
- } \
- UPB_INLINE type_t upb_value_get##name(upb_value val) \
- { \
- return (type_t)(converter)val.val; \
- }
-
- FUNCS(int32, int32, int32_t, int32_t, UPB_CTYPE_INT32)
- FUNCS(int64, int64, int64_t, int64_t, UPB_CTYPE_INT64)
- FUNCS(uint32, uint32, uint32_t, uint32_t, UPB_CTYPE_UINT32)
- FUNCS(uint64, uint64, uint64_t, uint64_t, UPB_CTYPE_UINT64)
- FUNCS(bool, _bool, bool, bool, UPB_CTYPE_BOOL)
- FUNCS(cstr, cstr, char*, uintptr_t, UPB_CTYPE_CSTR)
- FUNCS(ptr, ptr, void*, uintptr_t, UPB_CTYPE_PTR)
- FUNCS(constptr, constptr, const void*, uintptr_t, UPB_CTYPE_CONSTPTR)
-
- #undef FUNCS
-
- UPB_INLINE void upb_value_setfloat(upb_value* val, float cval)
- {
- memcpy(&val->val, &cval, sizeof(cval));
- }
-
- UPB_INLINE void upb_value_setdouble(upb_value* val, double cval)
- {
- memcpy(&val->val, &cval, sizeof(cval));
- }
-
- UPB_INLINE upb_value upb_value_float(float cval)
- {
- upb_value ret;
- upb_value_setfloat(&ret, cval);
- return ret;
- }
-
- UPB_INLINE upb_value upb_value_double(double cval)
- {
- upb_value ret;
- upb_value_setdouble(&ret, cval);
- return ret;
- }
-
- #undef SET_TYPE
-
- /* upb_tabkey *****************************************************************/
-
- /* Either:
- * 1. an actual integer key, or
- * 2. a pointer to a string prefixed by its uint32_t length, owned by us.
- *
- * ...depending on whether this is a string table or an int table. We would
- * make this a union of those two types, but C89 doesn't support statically
- * initializing a non-first union member. */
- typedef uintptr_t upb_tabkey;
-
- UPB_INLINE char* upb_tabstr(upb_tabkey key, uint32_t* len)
- {
- char* mem = (char*)key;
- if (len)
- memcpy(len, mem, sizeof(*len));
- return mem + sizeof(*len);
- }
-
- UPB_INLINE upb_StringView upb_tabstrview(upb_tabkey key)
- {
- upb_StringView ret;
- uint32_t len;
- ret.data = upb_tabstr(key, &len);
- ret.size = len;
- return ret;
- }
-
- /* upb_tabval *****************************************************************/
-
- typedef struct upb_tabval
- {
- uint64_t val;
- } upb_tabval;
-
- #define UPB_TABVALUE_EMPTY_INIT \
- { \
- -1 \
- }
-
- /* upb_table ******************************************************************/
-
- typedef struct _upb_tabent
- {
- upb_tabkey key;
- upb_tabval val;
-
- /* Internal chaining. This is const so we can create static initializers for
- * tables. We cast away const sometimes, but *only* when the containing
- * upb_table is known to be non-const. This requires a bit of care, but
- * the subtlety is confined to table.c. */
- const struct _upb_tabent* next;
- } upb_tabent;
-
- typedef struct
- {
- size_t count; /* Number of entries in the hash part. */
- uint32_t mask; /* Mask to turn hash value -> bucket. */
- uint32_t max_count; /* Max count before we hit our load limit. */
- uint8_t size_lg2; /* Size of the hashtable part is 2^size_lg2 entries. */
- upb_tabent* entries;
- } upb_table;
-
- typedef struct
- {
- upb_table t;
- } upb_strtable;
-
- typedef struct
- {
- upb_table t; /* For entries that don't fit in the array part. */
- const upb_tabval* array; /* Array part of the table. See const note above. */
- size_t array_size; /* Array part size. */
- size_t array_count; /* Array part number of elements. */
- } upb_inttable;
-
- UPB_INLINE size_t upb_table_size(const upb_table* t)
- {
- if (t->size_lg2 == 0)
- return 0;
- else
- return 1 << t->size_lg2;
- }
-
- /* Internal-only functions, in .h file only out of necessity. */
- UPB_INLINE bool upb_tabent_isempty(const upb_tabent* e)
- {
- return e->key == 0;
- }
-
- /* Initialize and uninitialize a table, respectively. If memory allocation
- * failed, false is returned that the table is uninitialized. */
- bool upb_inttable_init(upb_inttable* table, upb_Arena* a);
- bool upb_strtable_init(upb_strtable* table, size_t expected_size, upb_Arena* a);
-
- /* Returns the number of values in the table. */
- size_t upb_inttable_count(const upb_inttable* t);
- UPB_INLINE size_t upb_strtable_count(const upb_strtable* t)
- {
- return t->t.count;
- }
-
- void upb_strtable_clear(upb_strtable* t);
-
- /* Inserts the given key into the hashtable with the given value. The key must
- * not already exist in the hash table. For strtables, the key is not required
- * to be NULL-terminated, and the table will make an internal copy of the key.
- * Inttables must not insert a value of UINTPTR_MAX.
- *
- * If a table resize was required but memory allocation failed, false is
- * returned and the table is unchanged. */
- bool upb_inttable_insert(upb_inttable* t, uintptr_t key, upb_value val, upb_Arena* a);
- bool upb_strtable_insert(upb_strtable* t, const char* key, size_t len, upb_value val, upb_Arena* a);
-
- /* Looks up key in this table, returning "true" if the key was found.
- * If v is non-NULL, copies the value for this key into *v. */
- bool upb_inttable_lookup(const upb_inttable* t, uintptr_t key, upb_value* v);
- bool upb_strtable_lookup2(const upb_strtable* t, const char* key, size_t len, upb_value* v);
-
- /* For NULL-terminated strings. */
- UPB_INLINE bool upb_strtable_lookup(const upb_strtable* t, const char* key, upb_value* v)
- {
- return upb_strtable_lookup2(t, key, strlen(key), v);
- }
-
- /* Removes an item from the table. Returns true if the remove was successful,
- * and stores the removed item in *val if non-NULL. */
- bool upb_inttable_remove(upb_inttable* t, uintptr_t key, upb_value* val);
- bool upb_strtable_remove2(upb_strtable* t, const char* key, size_t len, upb_value* val);
-
- UPB_INLINE bool upb_strtable_remove(upb_strtable* t, const char* key, upb_value* v)
- {
- return upb_strtable_remove2(t, key, strlen(key), v);
- }
-
- /* Updates an existing entry in an inttable. If the entry does not exist,
- * returns false and does nothing. Unlike insert/remove, this does not
- * invalidate iterators. */
- bool upb_inttable_replace(upb_inttable* t, uintptr_t key, upb_value val);
-
- /* Optimizes the table for the current set of entries, for both memory use and
- * lookup time. Client should call this after all entries have been inserted;
- * inserting more entries is legal, but will likely require a table resize. */
- void upb_inttable_compact(upb_inttable* t, upb_Arena* a);
-
- /* Exposed for testing only. */
- bool upb_strtable_resize(upb_strtable* t, size_t size_lg2, upb_Arena* a);
-
- /* Iterators ******************************************************************/
-
- /* Iteration over inttable.
- *
- * intptr_t iter = UPB_INTTABLE_BEGIN;
- * uintptr_t key;
- * upb_value val;
- * while (upb_inttable_next2(t, &key, &val, &iter)) {
- * // ...
- * }
- */
-
- #define UPB_INTTABLE_BEGIN -1
-
- bool upb_inttable_next2(const upb_inttable* t, uintptr_t* key, upb_value* val, intptr_t* iter);
- void upb_inttable_removeiter(upb_inttable* t, intptr_t* iter);
-
- /* Iteration over strtable.
- *
- * intptr_t iter = UPB_INTTABLE_BEGIN;
- * upb_StringView key;
- * upb_value val;
- * while (upb_strtable_next2(t, &key, &val, &iter)) {
- * // ...
- * }
- */
-
- #define UPB_STRTABLE_BEGIN -1
-
- bool upb_strtable_next2(const upb_strtable* t, upb_StringView* key, upb_value* val, intptr_t* iter);
- void upb_strtable_removeiter(upb_strtable* t, intptr_t* iter);
-
- /* DEPRECATED iterators, slated for removal.
- *
- * Iterators for int and string tables. We are subject to some kind of unusual
- * design constraints:
- *
- * For high-level languages:
- * - we must be able to guarantee that we don't crash or corrupt memory even if
- * the program accesses an invalidated iterator.
- *
- * For C++11 range-based for:
- * - iterators must be copyable
- * - iterators must be comparable
- * - it must be possible to construct an "end" value.
- *
- * Iteration order is undefined.
- *
- * Modifying the table invalidates iterators. upb_{str,int}table_done() is
- * guaranteed to work even on an invalidated iterator, as long as the table it
- * is iterating over has not been freed. Calling next() or accessing data from
- * an invalidated iterator yields unspecified elements from the table, but it is
- * guaranteed not to crash and to return real table elements (except when done()
- * is true). */
-
- /* upb_strtable_iter **********************************************************/
-
- /* upb_strtable_iter i;
- * upb_strtable_begin(&i, t);
- * for(; !upb_strtable_done(&i); upb_strtable_next(&i)) {
- * const char *key = upb_strtable_iter_key(&i);
- * const upb_value val = upb_strtable_iter_value(&i);
- * // ...
- * }
- */
-
- typedef struct
- {
- const upb_strtable* t;
- size_t index;
- } upb_strtable_iter;
-
- void upb_strtable_begin(upb_strtable_iter* i, const upb_strtable* t);
- void upb_strtable_next(upb_strtable_iter* i);
- bool upb_strtable_done(const upb_strtable_iter* i);
- upb_StringView upb_strtable_iter_key(const upb_strtable_iter* i);
- upb_value upb_strtable_iter_value(const upb_strtable_iter* i);
- void upb_strtable_iter_setdone(upb_strtable_iter* i);
- bool upb_strtable_iter_isequal(const upb_strtable_iter* i1, const upb_strtable_iter* i2);
-
- /* upb_inttable_iter **********************************************************/
-
- /* upb_inttable_iter i;
- * upb_inttable_begin(&i, t);
- * for(; !upb_inttable_done(&i); upb_inttable_next(&i)) {
- * uintptr_t key = upb_inttable_iter_key(&i);
- * upb_value val = upb_inttable_iter_value(&i);
- * // ...
- * }
- */
-
- typedef struct
- {
- const upb_inttable* t;
- size_t index;
- bool array_part;
- } upb_inttable_iter;
-
- UPB_INLINE const upb_tabent* str_tabent(const upb_strtable_iter* i)
- {
- return &i->t->t.entries[i->index];
- }
-
- void upb_inttable_begin(upb_inttable_iter* i, const upb_inttable* t);
- void upb_inttable_next(upb_inttable_iter* i);
- bool upb_inttable_done(const upb_inttable_iter* i);
- uintptr_t upb_inttable_iter_key(const upb_inttable_iter* i);
- upb_value upb_inttable_iter_value(const upb_inttable_iter* i);
- void upb_inttable_iter_setdone(upb_inttable_iter* i);
- bool upb_inttable_iter_isequal(const upb_inttable_iter* i1, const upb_inttable_iter* i2);
-
- uint32_t _upb_Hash(const void* p, size_t n, uint64_t seed);
-
- #ifdef __cplusplus
- } /* extern "C" */
- #endif
-
- #include "upb/port_undef.inc"
-
- #endif /* UPB_INTERNAL_TABLE_H_ */
|