use uint32_t

This commit is contained in:
blueloveTH 2023-02-25 00:31:17 +08:00
parent 298739bfef
commit 43b7130f99
5 changed files with 95 additions and 81 deletions

View File

@ -73,4 +73,4 @@ struct Type {
const float kLocalsLoadFactor = 0.67; const float kLocalsLoadFactor = 0.67;
const float kInstAttrLoadFactor = 0.67; const float kInstAttrLoadFactor = 0.67;
const float kTypeAttrLoadFactor = 0.34; const float kTypeAttrLoadFactor = 0.5;

View File

@ -2,7 +2,7 @@
#include "codeobject.h" #include "codeobject.h"
static THREAD_LOCAL i64 kFrameGlobalId = 0; static THREAD_LOCAL uint64_t kFrameGlobalId = 0;
struct Frame { struct Frame {
std::vector<PyVar> _data; std::vector<PyVar> _data;
@ -11,10 +11,10 @@ struct Frame {
const CodeObject* co; const CodeObject* co;
PyVar _module; PyVar _module;
pkpy::shared_ptr<pkpy::NameDict> _locals; NameDict_ _locals;
pkpy::shared_ptr<pkpy::NameDict> _closure; NameDict_ _closure;
const i64 id; const uint64_t id;
std::stack<std::pair<int, std::vector<PyVar>>> s_try_block; std::vector<std::pair<int, std::vector<PyVar>>> s_try_block;
inline pkpy::NameDict& f_locals() noexcept { return _locals != nullptr ? *_locals : _module->attr(); } inline pkpy::NameDict& f_locals() noexcept { return _locals != nullptr ? *_locals : _module->attr(); }
inline pkpy::NameDict& f_globals() noexcept { return _module->attr(); } inline pkpy::NameDict& f_globals() noexcept { return _module->attr(); }
@ -24,9 +24,11 @@ struct Frame {
return _closure->try_get(name); return _closure->try_get(name);
} }
Frame(const CodeObject_& co, const PyVar& _module, Frame(const CodeObject_& co,
pkpy::shared_ptr<pkpy::NameDict> _locals=nullptr, pkpy::shared_ptr<pkpy::NameDict> _closure=nullptr) const PyVar& _module,
: co(co.get()), _module(_module), _locals(_locals), _closure(_closure), id(kFrameGlobalId++) { } const NameDict_& _locals=nullptr,
const NameDict_& _closure=nullptr)
: co(co.get()), _module(_module), _locals(_locals), _closure(_closure), id(kFrameGlobalId++) { }
inline const Bytecode& next_bytecode() { inline const Bytecode& next_bytecode() {
_ip = _next_ip++; _ip = _next_ip++;
@ -96,17 +98,17 @@ struct Frame {
inline void jump_rel(int i){ _next_ip += i; } inline void jump_rel(int i){ _next_ip += i; }
inline void on_try_block_enter(){ inline void on_try_block_enter(){
s_try_block.push(std::make_pair(co->codes[_ip].block, _data)); s_try_block.emplace_back(co->codes[_ip].block, _data);
} }
inline void on_try_block_exit(){ inline void on_try_block_exit(){
s_try_block.pop(); s_try_block.pop_back();
} }
bool jump_to_exception_handler(){ bool jump_to_exception_handler(){
if(s_try_block.empty()) return false; if(s_try_block.empty()) return false;
PyVar obj = pop(); PyVar obj = pop();
auto& p = s_try_block.top(); auto& p = s_try_block.back();
_data = std::move(p.second); _data = std::move(p.second);
_data.push_back(obj); _data.push_back(obj);
_next_ip = co->blocks[p.first].end; _next_ip = co->blocks[p.first].end;

View File

@ -4,16 +4,17 @@
#include "memory.h" #include "memory.h"
#include "str.h" #include "str.h"
const int kNameDictNodeSize = sizeof(StrName) + sizeof(PyVar);
template<int __Bucket, int __BucketSize=32> template<int __Bucket, int __BucketSize=32>
struct DictArrayPool { struct DictArrayPool {
std::deque<StrName*> buckets[__Bucket+1]; std::vector<StrName*> buckets[__Bucket+1];
StrName* alloc(uint32_t n){ StrName* alloc(uint16_t n){
StrName* _keys; StrName* _keys;
if(n > __Bucket || buckets[n].empty()){ if(n > __Bucket || buckets[n].empty()){
_keys = (StrName*)malloc((sizeof(StrName)+sizeof(PyVar)) * n); _keys = (StrName*)malloc(kNameDictNodeSize * n);
memset((void*)_keys, 0, (sizeof(StrName)+sizeof(PyVar)) * n); memset((void*)_keys, 0, kNameDictNodeSize * n);
}else{ }else{
_keys = buckets[n].back(); _keys = buckets[n].back();
memset((void*)_keys, 0, sizeof(StrName) * n); memset((void*)_keys, 0, sizeof(StrName) * n);
@ -22,7 +23,7 @@ struct DictArrayPool {
return _keys; return _keys;
} }
void dealloc(StrName* head, uint32_t n){ void dealloc(StrName* head, uint16_t n){
PyVar* _values = (PyVar*)(head + n); PyVar* _values = (PyVar*)(head + n);
if(n > __Bucket || buckets[n].size() >= __BucketSize){ if(n > __Bucket || buckets[n].size() >= __BucketSize){
for(int i=0; i<n; i++) _values[i].~PyVar(); for(int i=0; i<n; i++) _values[i].~PyVar();
@ -38,76 +39,89 @@ struct DictArrayPool {
}; };
namespace pkpy{ namespace pkpy{
const std::vector<uint32_t> kHashSeeds = {2654435761, 740041872, 89791836, 2530921597, 3099937610, 4149637300, 2701344377, 1871341841, 1162794509, 172427115, 1636841237, 716883023, 3294650677, 54921151, 3697702254, 632800580, 704251301, 1107400416, 3158440428, 581874317, 3196521560, 2374935651, 3196227762, 2033551959, 2028119291, 348132418, 392150876, 3839168722, 3705071505, 742931757, 2917622539, 3641634736, 3438863246, 1211314974, 1389620692, 3842835768, 165823282, 2225611914, 1862128271, 2147948325, 3759309280, 2087364973, 3453466014, 2082604761, 3627961499, 967790220, 3285133283, 2749567844, 262853493, 142639230, 3079101350, 2942333634, 1470374050, 3719337124, 2487858314, 1605159164, 2958061235, 3310454023, 3143584575, 3696188862, 3455413544, 148400163, 889426286, 1485235735}; const std::vector<uint16_t> kHashSeeds = {9629, 43049, 13267, 59509, 39251, 1249, 35803, 54469, 27689, 9719, 34897, 18973, 30661, 19913, 27919, 32143, 3467, 28019, 1051, 39419, 1361, 28547, 48197, 2609, 24317, 22861, 41467, 17623, 52837, 59053, 33589, 32117};
static DictArrayPool<32> _dict_pool; static DictArrayPool<32> _dict_pool;
uint32_t find_next_capacity(uint32_t n){ uint16_t find_next_capacity(uint16_t n){
uint32_t x = 2; uint16_t x = 2;
while(x < n) x *= 2; while(x < n) x <<= 1;
return x; return x;
} }
#define _hash(key, mask, hash_seed) ( ( (key).index * (hash_seed) >> 16 ) & (mask) ) #define _hash(key, mask, hash_seed) ( ( (key).index * (hash_seed) >> 8 ) & (mask) )
uint32_t find_perfect_hash_seed(uint32_t capacity, const std::vector<StrName>& keys){ uint16_t find_perfect_hash_seed(uint16_t capacity, const std::vector<StrName>& keys){
if(keys.empty()) return kHashSeeds[0]; if(keys.empty()) return kHashSeeds[0];
std::set<uint32_t> indices; std::set<uint16_t> indices;
std::vector<std::pair<uint32_t, float>> scores; std::pair<uint16_t, float> best_score = {kHashSeeds[0], 0};
for(int i=0; i<kHashSeeds.size(); i++){ for(int i=0; i<kHashSeeds.size(); i++){
indices.clear(); indices.clear();
for(auto key: keys){ for(auto key: keys){
uint32_t index = _hash(key, capacity-1, kHashSeeds[i]); uint16_t index = _hash(key, capacity-1, kHashSeeds[i]);
indices.insert(index); indices.insert(index);
} }
float score = indices.size() / (float)keys.size(); float score = indices.size() / (float)keys.size();
scores.push_back({kHashSeeds[i], score}); if(score > best_score.second) best_score = {kHashSeeds[i], score};
} }
std::sort(scores.begin(), scores.end(), [](auto a, auto b){ return a.second > b.second; }); return best_score.first;
return scores[0].first;
} }
struct NameDict { struct NameDict {
uint32_t _capacity; uint16_t _capacity;
uint32_t _size; uint16_t _size;
float _load_factor; float _load_factor;
uint32_t _hash_seed; uint16_t _hash_seed;
uint32_t _mask; uint16_t _mask;
StrName* _keys; StrName* _keys;
PyVar* _values;
inline void _alloc(uint32_t capacity){ inline PyVar& value(uint16_t i){
_keys = _dict_pool.alloc(capacity); return reinterpret_cast<PyVar*>(_keys + _capacity)[i];
_values = (PyVar*)(_keys + capacity);
} }
inline void _dealloc(StrName* head, uint32_t capacity){ inline const PyVar& value(uint16_t i) const {
return reinterpret_cast<const PyVar*>(_keys + _capacity)[i];
}
inline void _alloc(uint16_t capacity){
_keys = _dict_pool.alloc(capacity);
}
inline static void _dealloc(StrName* head, uint16_t capacity){
if(head == nullptr) return;
_dict_pool.dealloc(head, capacity); _dict_pool.dealloc(head, capacity);
} }
NameDict(uint32_t capacity=2, float load_factor=0.67, uint32_t hash_seed=kHashSeeds[0]): NameDict(uint16_t capacity=2, float load_factor=0.67, uint16_t hash_seed=kHashSeeds[0]):
_capacity(capacity), _size(0), _load_factor(load_factor), _capacity(capacity), _size(0), _load_factor(load_factor),
_hash_seed(hash_seed), _mask(capacity-1) { _hash_seed(hash_seed), _mask(capacity-1) {
_alloc(capacity); _alloc(capacity);
} }
NameDict(const NameDict& other) { NameDict(const NameDict& other) {
this->_capacity = other._capacity; memcpy(this, &other, sizeof(NameDict));
this->_size = other._size;
this->_load_factor = other._load_factor;
this->_hash_seed = other._hash_seed;
_alloc(_capacity); _alloc(_capacity);
this->_mask = other._mask; for(int i=0; i<_capacity; i++){
for(uint32_t i=0; i<_capacity; i++){
_keys[i] = other._keys[i]; _keys[i] = other._keys[i];
_values[i] = other._values[i]; value(i) = other.value(i);
} }
} }
NameDict& operator=(const NameDict&) = delete; NameDict& operator=(const NameDict& other) {
_dealloc(_keys, _capacity);
memcpy(this, &other, sizeof(NameDict));
_alloc(_capacity);
for(int i=0; i<_capacity; i++){
_keys[i] = other._keys[i];
value(i) = other.value(i);
}
return *this;
}
~NameDict(){ _dict_pool.dealloc(_keys, _capacity); }
NameDict(NameDict&&) = delete; NameDict(NameDict&&) = delete;
NameDict& operator=(NameDict&&) = delete; NameDict& operator=(NameDict&&) = delete;
uint16_t size() const { return _size; }
uint32_t size() const { return _size; }
#define HASH_PROBE(key, ok, i) \ #define HASH_PROBE(key, ok, i) \
ok = false; \ ok = false; \
@ -118,22 +132,22 @@ namespace pkpy{
} }
const PyVar& operator[](StrName key) const { const PyVar& operator[](StrName key) const {
bool ok; uint32_t i; bool ok; uint16_t i;
HASH_PROBE(key, ok, i); HASH_PROBE(key, ok, i);
if(!ok) throw std::out_of_range("NameDict key not found: " + key.str()); if(!ok) throw std::out_of_range("NameDict key not found: " + key.str());
return _values[i]; return value(i);
} }
PyVar& get(StrName key){ PyVar& get(StrName key){
bool ok; uint32_t i; bool ok; uint16_t i;
HASH_PROBE(key, ok, i); HASH_PROBE(key, ok, i);
if(!ok) throw std::out_of_range("NameDict key not found: " + key.str()); if(!ok) throw std::out_of_range("NameDict key not found: " + key.str());
return _values[i]; return value(i);
} }
template<typename T> template<typename T>
void set(StrName key, T&& value){ void set(StrName key, T&& val){
bool ok; uint32_t i; bool ok; uint16_t i;
HASH_PROBE(key, ok, i); HASH_PROBE(key, ok, i);
if(!ok) { if(!ok) {
_size++; _size++;
@ -143,25 +157,25 @@ namespace pkpy{
} }
_keys[i] = key; _keys[i] = key;
} }
_values[i] = std::forward<T>(value); value(i) = std::forward<T>(val);
} }
void _rehash(bool resize){ void _rehash(bool resize){
StrName* old_keys = _keys; StrName* old_keys = _keys;
PyVar* old_values = _values; PyVar* old_values = &value(0);
uint32_t old_capacity = _capacity; uint16_t old_capacity = _capacity;
if(resize){ if(resize){
_capacity = find_next_capacity(_capacity * 2); _capacity = find_next_capacity(_capacity * 2);
_mask = _capacity - 1; _mask = _capacity - 1;
} }
_alloc(_capacity); _alloc(_capacity);
for(uint32_t i=0; i<old_capacity; i++){ for(uint16_t i=0; i<old_capacity; i++){
if(old_keys[i].empty()) continue; if(old_keys[i].empty()) continue;
bool ok; uint32_t j; bool ok; uint16_t j;
HASH_PROBE(old_keys[i], ok, j); HASH_PROBE(old_keys[i], ok, j);
if(ok) UNREACHABLE(); if(ok) UNREACHABLE();
_keys[j] = old_keys[i]; _keys[j] = old_keys[i];
_values[j] = old_values[i]; // std::move makes a segfault value(j) = old_values[i]; // std::move makes a segfault
} }
_dealloc(old_keys, old_capacity); _dealloc(old_keys, old_capacity);
} }
@ -172,56 +186,53 @@ namespace pkpy{
} }
inline PyVar* try_get(StrName key){ inline PyVar* try_get(StrName key){
bool ok; uint32_t i; bool ok; uint16_t i;
HASH_PROBE(key, ok, i); HASH_PROBE(key, ok, i);
if(!ok) return nullptr; if(!ok) return nullptr;
return &_values[i]; return &value(i);
} }
inline bool try_set(StrName key, PyVar&& value){ inline bool try_set(StrName key, PyVar&& val){
bool ok; uint32_t i; bool ok; uint16_t i;
HASH_PROBE(key, ok, i); HASH_PROBE(key, ok, i);
if(!ok) return false; if(!ok) return false;
_values[i] = std::move(value); value(i) = std::move(val);
return true; return true;
} }
inline bool contains(StrName key) const { inline bool contains(StrName key) const {
bool ok; uint32_t i; bool ok; uint16_t i;
HASH_PROBE(key, ok, i); HASH_PROBE(key, ok, i);
return ok; return ok;
} }
~NameDict(){ _dealloc(_keys, _capacity); }
void update(const NameDict& other){ void update(const NameDict& other){
for(uint32_t i=0; i<other._capacity; i++){ for(uint16_t i=0; i<other._capacity; i++){
if(other._keys[i].empty()) continue; if(other._keys[i].empty()) continue;
set(other._keys[i], other._values[i]); set(other._keys[i], other.value(i));
} }
} }
void erase(StrName key){ void erase(StrName key){
bool ok; uint32_t i; bool ok; uint16_t i;
HASH_PROBE(key, ok, i); HASH_PROBE(key, ok, i);
if(!ok) throw std::out_of_range("NameDict key not found: " + key.str()); if(!ok) throw std::out_of_range("NameDict key not found: " + key.str());
_keys[i] = StrName(); _keys[i] = StrName(); value(i).reset();
_values[i].reset();
_size--; _size--;
} }
std::vector<std::pair<StrName, PyVar>> items() const { std::vector<std::pair<StrName, PyVar>> items() const {
std::vector<std::pair<StrName, PyVar>> v; std::vector<std::pair<StrName, PyVar>> v;
for(uint32_t i=0; i<_capacity; i++){ for(uint16_t i=0; i<_capacity; i++){
if(_keys[i].empty()) continue; if(_keys[i].empty()) continue;
v.push_back(std::make_pair(_keys[i], _values[i])); v.push_back(std::make_pair(_keys[i], value(i)));
} }
return v; return v;
} }
std::vector<StrName> keys() const { std::vector<StrName> keys() const {
std::vector<StrName> v; std::vector<StrName> v;
for(uint32_t i=0; i<_capacity; i++){ for(uint16_t i=0; i<_capacity; i++){
if(_keys[i].empty()) continue; if(_keys[i].empty()) continue;
v.push_back(_keys[i]); v.push_back(_keys[i]);
} }

View File

@ -10,6 +10,7 @@ class VM;
typedef std::function<PyVar(VM*, pkpy::Args&)> NativeFuncRaw; typedef std::function<PyVar(VM*, pkpy::Args&)> NativeFuncRaw;
typedef pkpy::shared_ptr<CodeObject> CodeObject_; typedef pkpy::shared_ptr<CodeObject> CodeObject_;
typedef pkpy::shared_ptr<pkpy::NameDict> NameDict_;
namespace pkpy{ namespace pkpy{
struct NativeFunc { struct NativeFunc {
@ -30,8 +31,8 @@ struct Function {
std::vector<StrName> kwargs_order; std::vector<StrName> kwargs_order;
// runtime settings // runtime settings
PyVar _module; PyVar _module = nullptr;
pkpy::shared_ptr<pkpy::NameDict> _closure; NameDict_ _closure = nullptr;
bool has_name(const Str& val) const { bool has_name(const Str& val) const {
bool _0 = std::find(args.begin(), args.end(), val) != args.end(); bool _0 = std::find(args.begin(), args.end(), val) != args.end();

View File

@ -159,7 +159,7 @@ public:
return f(this, args); return f(this, args);
} else if(is_type(*callable, tp_function)){ } else if(is_type(*callable, tp_function)){
const pkpy::Function& fn = PyFunction_AS_C(*callable); const pkpy::Function& fn = PyFunction_AS_C(*callable);
auto locals = pkpy::make_shared<pkpy::NameDict>( NameDict_ locals = pkpy::make_shared<pkpy::NameDict>(
fn.code->perfect_locals_capacity, fn.code->perfect_locals_capacity,
kLocalsLoadFactor, kLocalsLoadFactor,
fn.code->perfect_hash_seed fn.code->perfect_hash_seed
@ -218,7 +218,7 @@ public:
}catch (const pkpy::Exception& e){ }catch (const pkpy::Exception& e){
*_stderr << e.summary() << '\n'; *_stderr << e.summary() << '\n';
} }
#ifdef _NDEBUG #if !defined(__GNUC__)
catch (const std::exception& e) { catch (const std::exception& e) {
*_stderr << "An std::exception occurred! It could be a bug.\n"; *_stderr << "An std::exception occurred! It could be a bug.\n";
*_stderr << e.what() << '\n'; *_stderr << e.what() << '\n';