mirror of
https://github.com/pocketpy/pocketpy
synced 2025-10-20 03:20:18 +00:00
337 lines
9.1 KiB
C++
337 lines
9.1 KiB
C++
#pragma once
|
|
|
|
#include "common.h"
|
|
#include "memory.h"
|
|
#include "str.h"
|
|
|
|
namespace pkpy{
|
|
|
|
template<typename T>
|
|
constexpr T default_invalid_value(){
|
|
if constexpr(std::is_pointer_v<T>) return nullptr;
|
|
else if constexpr(std::is_same_v<int, T>) return -1;
|
|
else return Discarded();
|
|
}
|
|
|
|
#define PK_SMALL_NAME_DICT_CAPACITY 8
|
|
#define PK_SMALL_NAME_DICT_LOOP(B) for(int i=0; i<PK_SMALL_NAME_DICT_CAPACITY; i++) { B }
|
|
|
|
template<typename V>
|
|
struct SmallNameDict{
|
|
using K = StrName;
|
|
static_assert(std::is_pod_v<V>);
|
|
|
|
bool _is_small;
|
|
uint16_t _size;
|
|
K _keys[PK_SMALL_NAME_DICT_CAPACITY];
|
|
V _values[PK_SMALL_NAME_DICT_CAPACITY];
|
|
|
|
SmallNameDict(): _is_small(true), _size(0) {}
|
|
|
|
bool try_set(K key, V val){
|
|
PK_SMALL_NAME_DICT_LOOP(
|
|
if(_keys[i] == key){ _values[i] = val; return true; }
|
|
)
|
|
|
|
if(_size == PK_SMALL_NAME_DICT_CAPACITY) return false;
|
|
if(_keys[_size].empty()){
|
|
_keys[_size] = key;
|
|
_values[_size] = val;
|
|
_size++;
|
|
return true;
|
|
}
|
|
|
|
PK_SMALL_NAME_DICT_LOOP(
|
|
if(_keys[i].empty()){
|
|
_keys[i] = key;
|
|
_values[i] = val;
|
|
_size++;
|
|
return true;
|
|
}
|
|
)
|
|
PK_UNREACHABLE();
|
|
}
|
|
|
|
V try_get(K key) const {
|
|
PK_SMALL_NAME_DICT_LOOP(
|
|
if(_keys[i] == key) return _values[i];
|
|
)
|
|
return default_invalid_value<V>();
|
|
}
|
|
|
|
V* try_get_2(K key) {
|
|
PK_SMALL_NAME_DICT_LOOP(
|
|
if(_keys[i] == key) return &_values[i];
|
|
)
|
|
return nullptr;
|
|
}
|
|
|
|
bool del(K key){
|
|
PK_SMALL_NAME_DICT_LOOP(
|
|
if(_keys[i] == key){ _keys[i] = StrName(); _size--; return true; }
|
|
)
|
|
return false;
|
|
}
|
|
|
|
template<typename Func>
|
|
void apply(Func func) const {
|
|
PK_SMALL_NAME_DICT_LOOP(
|
|
if(!_keys[i].empty()) func(_keys[i], _values[i]);
|
|
)
|
|
}
|
|
|
|
void clear(){
|
|
PK_SMALL_NAME_DICT_LOOP(
|
|
_keys[i] = StrName();
|
|
)
|
|
_size = 0;
|
|
}
|
|
|
|
uint16_t size() const { return _size; }
|
|
uint16_t capacity() const { return PK_SMALL_NAME_DICT_CAPACITY; }
|
|
};
|
|
|
|
template<typename T>
|
|
struct LargeNameDict {
|
|
PK_ALWAYS_PASS_BY_POINTER(LargeNameDict)
|
|
|
|
using Item = std::pair<StrName, T>;
|
|
static constexpr uint16_t kInitialCapacity = 32;
|
|
static_assert(is_pod<T>::value);
|
|
|
|
bool _is_small;
|
|
float _load_factor;
|
|
uint16_t _size;
|
|
|
|
uint16_t _capacity;
|
|
uint16_t _critical_size;
|
|
uint16_t _mask;
|
|
|
|
Item* _items;
|
|
|
|
#define HASH_PROBE_1(key, ok, i) \
|
|
ok = false; \
|
|
i = key.index & _mask; \
|
|
while(!_items[i].first.empty()) { \
|
|
if(_items[i].first == (key)) { ok = true; break; } \
|
|
i = (i + 1) & _mask; \
|
|
}
|
|
|
|
#define HASH_PROBE_0 HASH_PROBE_1
|
|
|
|
LargeNameDict(float load_factor=PK_INST_ATTR_LOAD_FACTOR): _is_small(false), _load_factor(load_factor), _size(0) {
|
|
_set_capacity_and_alloc_items(kInitialCapacity);
|
|
}
|
|
|
|
~LargeNameDict(){ free(_items); }
|
|
|
|
uint16_t size() const { return _size; }
|
|
uint16_t capacity() const { return _capacity; }
|
|
|
|
void _set_capacity_and_alloc_items(uint16_t val){
|
|
_capacity = val;
|
|
_critical_size = val * _load_factor;
|
|
_mask = val - 1;
|
|
|
|
_items = (Item*)malloc(_capacity * sizeof(Item));
|
|
memset(_items, 0, _capacity * sizeof(Item));
|
|
}
|
|
|
|
void set(StrName key, T val){
|
|
bool ok; uint16_t i;
|
|
HASH_PROBE_1(key, ok, i);
|
|
if(!ok) {
|
|
_size++;
|
|
if(_size > _critical_size){
|
|
_rehash_2x();
|
|
HASH_PROBE_1(key, ok, i);
|
|
}
|
|
_items[i].first = key;
|
|
}
|
|
_items[i].second = val;
|
|
}
|
|
|
|
void _rehash_2x(){
|
|
Item* old_items = _items;
|
|
uint16_t old_capacity = _capacity;
|
|
_set_capacity_and_alloc_items(_capacity * 2);
|
|
for(uint16_t i=0; i<old_capacity; i++){
|
|
if(old_items[i].first.empty()) continue;
|
|
bool ok; uint16_t j;
|
|
HASH_PROBE_1(old_items[i].first, ok, j);
|
|
if(ok) PK_FATAL_ERROR();
|
|
_items[j] = old_items[i];
|
|
}
|
|
free(old_items);
|
|
}
|
|
|
|
T try_get(StrName key) const{
|
|
bool ok; uint16_t i;
|
|
HASH_PROBE_0(key, ok, i);
|
|
if(!ok) return default_invalid_value<T>();
|
|
return _items[i].second;
|
|
}
|
|
|
|
T* try_get_2(StrName key) {
|
|
bool ok; uint16_t i;
|
|
HASH_PROBE_0(key, ok, i);
|
|
if(!ok) return nullptr;
|
|
return &_items[i].second;
|
|
}
|
|
|
|
T try_get_likely_found(StrName key) const{
|
|
uint16_t i = key.index & _mask;
|
|
if(_items[i].first == key) return _items[i].second;
|
|
i = (i + 1) & _mask;
|
|
if(_items[i].first == key) return _items[i].second;
|
|
return try_get(key);
|
|
}
|
|
|
|
T* try_get_2_likely_found(StrName key) {
|
|
uint16_t i = key.index & _mask;
|
|
if(_items[i].first == key) return &_items[i].second;
|
|
i = (i + 1) & _mask;
|
|
if(_items[i].first == key) return &_items[i].second;
|
|
return try_get_2(key);
|
|
}
|
|
|
|
bool del(StrName key){
|
|
bool ok; uint16_t i;
|
|
HASH_PROBE_0(key, ok, i);
|
|
if(!ok) return false;
|
|
_items[i].first = StrName();
|
|
_items[i].second = nullptr;
|
|
_size--;
|
|
// tidy
|
|
uint16_t pre_z = i;
|
|
uint16_t z = (i + 1) & _mask;
|
|
while(!_items[z].first.empty()){
|
|
uint16_t h = _items[z].first.index & _mask;
|
|
if(h != i) break;
|
|
std::swap(_items[pre_z], _items[z]);
|
|
pre_z = z;
|
|
z = (z + 1) & _mask;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
template<typename __Func>
|
|
void apply(__Func func) const {
|
|
for(uint16_t i=0; i<_capacity; i++){
|
|
if(_items[i].first.empty()) continue;
|
|
func(_items[i].first, _items[i].second);
|
|
}
|
|
}
|
|
|
|
std::vector<StrName> keys() const {
|
|
std::vector<StrName> v;
|
|
for(uint16_t i=0; i<_capacity; i++){
|
|
if(_items[i].first.empty()) continue;
|
|
v.push_back(_items[i].first);
|
|
}
|
|
return v;
|
|
}
|
|
|
|
void clear(){
|
|
for(uint16_t i=0; i<_capacity; i++){
|
|
_items[i].first = StrName();
|
|
_items[i].second = nullptr;
|
|
}
|
|
_size = 0;
|
|
}
|
|
#undef HASH_PROBE_0
|
|
#undef HASH_PROBE_1
|
|
};
|
|
|
|
template<typename V>
|
|
struct NameDictImpl{
|
|
PK_ALWAYS_PASS_BY_POINTER(NameDictImpl)
|
|
|
|
union{
|
|
SmallNameDict<V> _small;
|
|
LargeNameDict<V> _large;
|
|
};
|
|
|
|
NameDictImpl(): _small() {}
|
|
NameDictImpl(float load_factor): _large(load_factor) {}
|
|
|
|
bool is_small() const{
|
|
const bool* p = reinterpret_cast<const bool*>(this);
|
|
return *p;
|
|
}
|
|
|
|
void set(StrName key, V val){
|
|
if(is_small()){
|
|
bool ok = _small.try_set(key, val);
|
|
if(!ok){
|
|
SmallNameDict<V> copied(_small);
|
|
// move to large name dict
|
|
new (&_large) LargeNameDict<V>();
|
|
copied.apply([&](StrName key, V val){
|
|
_large.set(key, val);
|
|
});
|
|
_large.set(key, val);
|
|
}
|
|
}else{
|
|
_large.set(key, val);
|
|
}
|
|
}
|
|
|
|
uint16_t size() const{ return is_small() ?_small.size() : _large.size(); }
|
|
uint16_t capacity() const{ return is_small() ?_small.capacity() : _large.capacity(); }
|
|
V try_get(StrName key) const { return is_small() ?_small.try_get(key) : _large.try_get(key); }
|
|
V* try_get_2(StrName key) { return is_small() ?_small.try_get_2(key) : _large.try_get_2(key); }
|
|
bool del(StrName key){ return is_small() ?_small.del(key) : _large.del(key); }
|
|
|
|
V try_get_likely_found(StrName key) const { return is_small() ?_small.try_get(key) : _large.try_get_likely_found(key); }
|
|
V* try_get_2_likely_found(StrName key) { return is_small() ?_small.try_get_2(key) : _large.try_get_2_likely_found(key); }
|
|
|
|
bool contains(StrName key) const { return try_get(key) != default_invalid_value<V>(); }
|
|
|
|
V operator[](StrName key) const {
|
|
V val = try_get_likely_found(key);
|
|
if(val == default_invalid_value<V>()){
|
|
throw std::runtime_error(fmt("NameDict key not found: ", key.escape()).str());
|
|
}
|
|
return val;
|
|
}
|
|
|
|
void clear(){
|
|
if(is_small()) _small.clear();
|
|
else _large.clear();
|
|
}
|
|
|
|
template<typename Func>
|
|
void apply(Func func) const {
|
|
if(is_small()) _small.apply(func);
|
|
else _large.apply(func);
|
|
}
|
|
|
|
std::vector<StrName> keys() const{
|
|
std::vector<StrName> v;
|
|
apply([&](StrName key, V val){
|
|
v.push_back(key);
|
|
});
|
|
return v;
|
|
}
|
|
|
|
std::vector<std::pair<StrName, V>> items() const{
|
|
std::vector<std::pair<StrName, V>> v;
|
|
apply([&](StrName key, V val){
|
|
v.push_back({key, val});
|
|
});
|
|
return v;
|
|
}
|
|
|
|
~NameDictImpl(){
|
|
if(!is_small()) _large.~LargeNameDict<V>();
|
|
}
|
|
};
|
|
|
|
using NameDict = NameDictImpl<PyObject*>;
|
|
using NameDict_ = std::shared_ptr<NameDict>;
|
|
using NameDictInt = NameDictImpl<int>;
|
|
|
|
static_assert(sizeof(NameDict) <= 128);
|
|
|
|
} // namespace pkpy
|