|
|
@@ -4,16 +4,17 @@
|
|
|
#include "memory.h"
|
|
|
#include "str.h"
|
|
|
|
|
|
+const int kNameDictNodeSize = sizeof(StrName) + sizeof(PyVar);
|
|
|
|
|
|
template<int __Bucket, int __BucketSize=32>
|
|
|
struct DictArrayPool {
|
|
|
- std::deque<StrName*> buckets[__Bucket+1];
|
|
|
+ std::vector<StrName*> buckets[__Bucket+1];
|
|
|
|
|
|
- StrName* alloc(uint32_t n){
|
|
|
+ StrName* alloc(uint16_t n){
|
|
|
StrName* _keys;
|
|
|
if(n > __Bucket || buckets[n].empty()){
|
|
|
- _keys = (StrName*)malloc((sizeof(StrName)+sizeof(PyVar)) * n);
|
|
|
- memset((void*)_keys, 0, (sizeof(StrName)+sizeof(PyVar)) * n);
|
|
|
+ _keys = (StrName*)malloc(kNameDictNodeSize * n);
|
|
|
+ memset((void*)_keys, 0, kNameDictNodeSize * n);
|
|
|
}else{
|
|
|
_keys = buckets[n].back();
|
|
|
memset((void*)_keys, 0, sizeof(StrName) * n);
|
|
|
@@ -22,7 +23,7 @@ struct DictArrayPool {
|
|
|
return _keys;
|
|
|
}
|
|
|
|
|
|
- void dealloc(StrName* head, uint32_t n){
|
|
|
+ void dealloc(StrName* head, uint16_t n){
|
|
|
PyVar* _values = (PyVar*)(head + n);
|
|
|
if(n > __Bucket || buckets[n].size() >= __BucketSize){
|
|
|
for(int i=0; i<n; i++) _values[i].~PyVar();
|
|
|
@@ -38,76 +39,89 @@ struct DictArrayPool {
|
|
|
};
|
|
|
|
|
|
namespace pkpy{
|
|
|
- const std::vector<uint32_t> kHashSeeds = {2654435761, 740041872, 89791836, 2530921597, 3099937610, 4149637300, 2701344377, 1871341841, 1162794509, 172427115, 1636841237, 716883023, 3294650677, 54921151, 3697702254, 632800580, 704251301, 1107400416, 3158440428, 581874317, 3196521560, 2374935651, 3196227762, 2033551959, 2028119291, 348132418, 392150876, 3839168722, 3705071505, 742931757, 2917622539, 3641634736, 3438863246, 1211314974, 1389620692, 3842835768, 165823282, 2225611914, 1862128271, 2147948325, 3759309280, 2087364973, 3453466014, 2082604761, 3627961499, 967790220, 3285133283, 2749567844, 262853493, 142639230, 3079101350, 2942333634, 1470374050, 3719337124, 2487858314, 1605159164, 2958061235, 3310454023, 3143584575, 3696188862, 3455413544, 148400163, 889426286, 1485235735};
|
|
|
+ const std::vector<uint16_t> kHashSeeds = {9629, 43049, 13267, 59509, 39251, 1249, 35803, 54469, 27689, 9719, 34897, 18973, 30661, 19913, 27919, 32143, 3467, 28019, 1051, 39419, 1361, 28547, 48197, 2609, 24317, 22861, 41467, 17623, 52837, 59053, 33589, 32117};
|
|
|
static DictArrayPool<32> _dict_pool;
|
|
|
|
|
|
- uint32_t find_next_capacity(uint32_t n){
|
|
|
- uint32_t x = 2;
|
|
|
- while(x < n) x *= 2;
|
|
|
+ uint16_t find_next_capacity(uint16_t n){
|
|
|
+ uint16_t x = 2;
|
|
|
+ while(x < n) x <<= 1;
|
|
|
return x;
|
|
|
}
|
|
|
|
|
|
-#define _hash(key, mask, hash_seed) ( ( (key).index * (hash_seed) >> 16 ) & (mask) )
|
|
|
+#define _hash(key, mask, hash_seed) ( ( (key).index * (hash_seed) >> 8 ) & (mask) )
|
|
|
|
|
|
- uint32_t find_perfect_hash_seed(uint32_t capacity, const std::vector<StrName>& keys){
|
|
|
+ uint16_t find_perfect_hash_seed(uint16_t capacity, const std::vector<StrName>& keys){
|
|
|
if(keys.empty()) return kHashSeeds[0];
|
|
|
- std::set<uint32_t> indices;
|
|
|
- std::vector<std::pair<uint32_t, float>> scores;
|
|
|
+ std::set<uint16_t> indices;
|
|
|
+ std::pair<uint16_t, float> best_score = {kHashSeeds[0], 0};
|
|
|
for(int i=0; i<kHashSeeds.size(); i++){
|
|
|
indices.clear();
|
|
|
for(auto key: keys){
|
|
|
- uint32_t index = _hash(key, capacity-1, kHashSeeds[i]);
|
|
|
+ uint16_t index = _hash(key, capacity-1, kHashSeeds[i]);
|
|
|
indices.insert(index);
|
|
|
}
|
|
|
float score = indices.size() / (float)keys.size();
|
|
|
- scores.push_back({kHashSeeds[i], score});
|
|
|
+ if(score > best_score.second) best_score = {kHashSeeds[i], score};
|
|
|
}
|
|
|
- std::sort(scores.begin(), scores.end(), [](auto a, auto b){ return a.second > b.second; });
|
|
|
- return scores[0].first;
|
|
|
+ return best_score.first;
|
|
|
}
|
|
|
|
|
|
struct NameDict {
|
|
|
- uint32_t _capacity;
|
|
|
- uint32_t _size;
|
|
|
+ uint16_t _capacity;
|
|
|
+ uint16_t _size;
|
|
|
float _load_factor;
|
|
|
- uint32_t _hash_seed;
|
|
|
- uint32_t _mask;
|
|
|
+ uint16_t _hash_seed;
|
|
|
+ uint16_t _mask;
|
|
|
StrName* _keys;
|
|
|
- PyVar* _values;
|
|
|
|
|
|
- inline void _alloc(uint32_t capacity){
|
|
|
+ inline PyVar& value(uint16_t i){
|
|
|
+ return reinterpret_cast<PyVar*>(_keys + _capacity)[i];
|
|
|
+ }
|
|
|
+
|
|
|
+ inline const PyVar& value(uint16_t i) const {
|
|
|
+ return reinterpret_cast<const PyVar*>(_keys + _capacity)[i];
|
|
|
+ }
|
|
|
+
|
|
|
+ inline void _alloc(uint16_t capacity){
|
|
|
_keys = _dict_pool.alloc(capacity);
|
|
|
- _values = (PyVar*)(_keys + capacity);
|
|
|
}
|
|
|
|
|
|
- inline void _dealloc(StrName* head, uint32_t capacity){
|
|
|
+ inline static void _dealloc(StrName* head, uint16_t capacity){
|
|
|
+ if(head == nullptr) return;
|
|
|
_dict_pool.dealloc(head, capacity);
|
|
|
}
|
|
|
|
|
|
- NameDict(uint32_t capacity=2, float load_factor=0.67, uint32_t hash_seed=kHashSeeds[0]):
|
|
|
+ NameDict(uint16_t capacity=2, float load_factor=0.67, uint16_t hash_seed=kHashSeeds[0]):
|
|
|
_capacity(capacity), _size(0), _load_factor(load_factor),
|
|
|
_hash_seed(hash_seed), _mask(capacity-1) {
|
|
|
_alloc(capacity);
|
|
|
}
|
|
|
|
|
|
NameDict(const NameDict& other) {
|
|
|
- this->_capacity = other._capacity;
|
|
|
- this->_size = other._size;
|
|
|
- this->_load_factor = other._load_factor;
|
|
|
- this->_hash_seed = other._hash_seed;
|
|
|
+ memcpy(this, &other, sizeof(NameDict));
|
|
|
+ _alloc(_capacity);
|
|
|
+ for(int i=0; i<_capacity; i++){
|
|
|
+ _keys[i] = other._keys[i];
|
|
|
+ value(i) = other.value(i);
|
|
|
+ }
|
|
|
+ }
|
|
|
+
|
|
|
+ NameDict& operator=(const NameDict& other) {
|
|
|
+ _dealloc(_keys, _capacity);
|
|
|
+ memcpy(this, &other, sizeof(NameDict));
|
|
|
_alloc(_capacity);
|
|
|
- this->_mask = other._mask;
|
|
|
- for(uint32_t i=0; i<_capacity; i++){
|
|
|
+ for(int i=0; i<_capacity; i++){
|
|
|
_keys[i] = other._keys[i];
|
|
|
- _values[i] = other._values[i];
|
|
|
+ value(i) = other.value(i);
|
|
|
}
|
|
|
+ return *this;
|
|
|
}
|
|
|
|
|
|
- NameDict& operator=(const NameDict&) = delete;
|
|
|
+ ~NameDict(){ _dict_pool.dealloc(_keys, _capacity); }
|
|
|
+
|
|
|
NameDict(NameDict&&) = delete;
|
|
|
NameDict& operator=(NameDict&&) = delete;
|
|
|
-
|
|
|
- uint32_t size() const { return _size; }
|
|
|
+ uint16_t size() const { return _size; }
|
|
|
|
|
|
#define HASH_PROBE(key, ok, i) \
|
|
|
ok = false; \
|
|
|
@@ -118,22 +132,22 @@ namespace pkpy{
|
|
|
}
|
|
|
|
|
|
const PyVar& operator[](StrName key) const {
|
|
|
- bool ok; uint32_t i;
|
|
|
+ bool ok; uint16_t i;
|
|
|
HASH_PROBE(key, ok, i);
|
|
|
if(!ok) throw std::out_of_range("NameDict key not found: " + key.str());
|
|
|
- return _values[i];
|
|
|
+ return value(i);
|
|
|
}
|
|
|
|
|
|
PyVar& get(StrName key){
|
|
|
- bool ok; uint32_t i;
|
|
|
+ bool ok; uint16_t i;
|
|
|
HASH_PROBE(key, ok, i);
|
|
|
if(!ok) throw std::out_of_range("NameDict key not found: " + key.str());
|
|
|
- return _values[i];
|
|
|
+ return value(i);
|
|
|
}
|
|
|
|
|
|
template<typename T>
|
|
|
- void set(StrName key, T&& value){
|
|
|
- bool ok; uint32_t i;
|
|
|
+ void set(StrName key, T&& val){
|
|
|
+ bool ok; uint16_t i;
|
|
|
HASH_PROBE(key, ok, i);
|
|
|
if(!ok) {
|
|
|
_size++;
|
|
|
@@ -143,25 +157,25 @@ namespace pkpy{
|
|
|
}
|
|
|
_keys[i] = key;
|
|
|
}
|
|
|
- _values[i] = std::forward<T>(value);
|
|
|
+ value(i) = std::forward<T>(val);
|
|
|
}
|
|
|
|
|
|
void _rehash(bool resize){
|
|
|
StrName* old_keys = _keys;
|
|
|
- PyVar* old_values = _values;
|
|
|
- uint32_t old_capacity = _capacity;
|
|
|
+ PyVar* old_values = &value(0);
|
|
|
+ uint16_t old_capacity = _capacity;
|
|
|
if(resize){
|
|
|
_capacity = find_next_capacity(_capacity * 2);
|
|
|
_mask = _capacity - 1;
|
|
|
}
|
|
|
_alloc(_capacity);
|
|
|
- for(uint32_t i=0; i<old_capacity; i++){
|
|
|
+ for(uint16_t i=0; i<old_capacity; i++){
|
|
|
if(old_keys[i].empty()) continue;
|
|
|
- bool ok; uint32_t j;
|
|
|
+ bool ok; uint16_t j;
|
|
|
HASH_PROBE(old_keys[i], ok, j);
|
|
|
if(ok) UNREACHABLE();
|
|
|
_keys[j] = old_keys[i];
|
|
|
- _values[j] = old_values[i]; // std::move makes a segfault
|
|
|
+ value(j) = old_values[i]; // std::move makes a segfault
|
|
|
}
|
|
|
_dealloc(old_keys, old_capacity);
|
|
|
}
|
|
|
@@ -172,56 +186,53 @@ namespace pkpy{
|
|
|
}
|
|
|
|
|
|
inline PyVar* try_get(StrName key){
|
|
|
- bool ok; uint32_t i;
|
|
|
+ bool ok; uint16_t i;
|
|
|
HASH_PROBE(key, ok, i);
|
|
|
if(!ok) return nullptr;
|
|
|
- return &_values[i];
|
|
|
+ return &value(i);
|
|
|
}
|
|
|
|
|
|
- inline bool try_set(StrName key, PyVar&& value){
|
|
|
- bool ok; uint32_t i;
|
|
|
+ inline bool try_set(StrName key, PyVar&& val){
|
|
|
+ bool ok; uint16_t i;
|
|
|
HASH_PROBE(key, ok, i);
|
|
|
if(!ok) return false;
|
|
|
- _values[i] = std::move(value);
|
|
|
+ value(i) = std::move(val);
|
|
|
return true;
|
|
|
}
|
|
|
|
|
|
inline bool contains(StrName key) const {
|
|
|
- bool ok; uint32_t i;
|
|
|
+ bool ok; uint16_t i;
|
|
|
HASH_PROBE(key, ok, i);
|
|
|
return ok;
|
|
|
}
|
|
|
|
|
|
- ~NameDict(){ _dealloc(_keys, _capacity); }
|
|
|
-
|
|
|
void update(const NameDict& other){
|
|
|
- for(uint32_t i=0; i<other._capacity; i++){
|
|
|
+ for(uint16_t i=0; i<other._capacity; i++){
|
|
|
if(other._keys[i].empty()) continue;
|
|
|
- set(other._keys[i], other._values[i]);
|
|
|
+ set(other._keys[i], other.value(i));
|
|
|
}
|
|
|
}
|
|
|
|
|
|
void erase(StrName key){
|
|
|
- bool ok; uint32_t i;
|
|
|
+ bool ok; uint16_t i;
|
|
|
HASH_PROBE(key, ok, i);
|
|
|
if(!ok) throw std::out_of_range("NameDict key not found: " + key.str());
|
|
|
- _keys[i] = StrName();
|
|
|
- _values[i].reset();
|
|
|
+ _keys[i] = StrName(); value(i).reset();
|
|
|
_size--;
|
|
|
}
|
|
|
|
|
|
std::vector<std::pair<StrName, PyVar>> items() const {
|
|
|
std::vector<std::pair<StrName, PyVar>> v;
|
|
|
- for(uint32_t i=0; i<_capacity; i++){
|
|
|
+ for(uint16_t i=0; i<_capacity; i++){
|
|
|
if(_keys[i].empty()) continue;
|
|
|
- v.push_back(std::make_pair(_keys[i], _values[i]));
|
|
|
+ v.push_back(std::make_pair(_keys[i], value(i)));
|
|
|
}
|
|
|
return v;
|
|
|
}
|
|
|
|
|
|
std::vector<StrName> keys() const {
|
|
|
std::vector<StrName> v;
|
|
|
- for(uint32_t i=0; i<_capacity; i++){
|
|
|
+ for(uint16_t i=0; i<_capacity; i++){
|
|
|
if(_keys[i].empty()) continue;
|
|
|
v.push_back(_keys[i]);
|
|
|
}
|