mirror of
https://github.com/pocketpy/pocketpy
synced 2025-10-20 11:30:18 +00:00
2378 lines
81 KiB
C
2378 lines
81 KiB
C
#include "pocketpy/compiler/compiler.h"
|
|
#include "pocketpy/compiler/lexer.h"
|
|
#include "pocketpy/objects/sourcedata.h"
|
|
#include "pocketpy/objects/object.h"
|
|
#include "pocketpy/common/strname.h"
|
|
#include "pocketpy/common/config.h"
|
|
#include "pocketpy/common/memorypool.h"
|
|
#include <ctype.h>
|
|
|
|
/* expr.h */
|
|
typedef struct Expr Expr;
|
|
typedef struct Ctx Ctx;
|
|
|
|
typedef struct ExprVt {
|
|
/* emit */
|
|
void (*emit_)(Expr*, Ctx*);
|
|
bool (*emit_del)(Expr*, Ctx*);
|
|
bool (*emit_store)(Expr*, Ctx*);
|
|
void (*emit_inplace)(Expr*, Ctx*);
|
|
bool (*emit_istore)(Expr*, Ctx*);
|
|
/* reflections */
|
|
bool is_literal;
|
|
bool is_json_object;
|
|
bool is_name; // NameExpr
|
|
bool is_tuple; // TupleExpr
|
|
bool is_attrib; // AttribExpr
|
|
bool is_subscr; // SubscrExpr
|
|
bool is_starred; // StarredExpr
|
|
bool is_binary; // BinaryExpr
|
|
void (*dtor)(Expr*);
|
|
} ExprVt;
|
|
|
|
#define static_assert_expr_size(T) static_assert(sizeof(T) <= kPoolExprBlockSize, "")
|
|
|
|
#define vtcall(f, self, ctx) ((self)->vt->f((self), (ctx)))
|
|
#define vtemit_(self, ctx) vtcall(emit_, (self), (ctx))
|
|
#define vtemit_del(self, ctx) ((self)->vt->emit_del ? vtcall(emit_del, self, ctx) : false)
|
|
#define vtemit_store(self, ctx) ((self)->vt->emit_store ? vtcall(emit_store, self, ctx) : false)
|
|
#define vtemit_inplace(self, ctx) \
|
|
((self)->vt->emit_inplace ? vtcall(emit_inplace, self, ctx) : vtemit_(self, ctx))
|
|
#define vtemit_istore(self, ctx) \
|
|
((self)->vt->emit_istore ? vtcall(emit_istore, self, ctx) : vtemit_store(self, ctx))
|
|
#define vtdelete(self) \
|
|
do { \
|
|
if(self) { \
|
|
if((self)->vt->dtor) (self)->vt->dtor(self); \
|
|
PoolExpr_dealloc(self); \
|
|
} \
|
|
} while(0)
|
|
|
|
#define EXPR_COMMON_HEADER \
|
|
const ExprVt* vt; \
|
|
int line;
|
|
|
|
typedef struct Expr {
|
|
EXPR_COMMON_HEADER
|
|
} Expr;
|
|
|
|
/* context.h */
|
|
typedef struct Ctx {
|
|
CodeObject* co; // 1 CodeEmitContext <=> 1 CodeObject*
|
|
FuncDecl* func; // optional, weakref
|
|
int level;
|
|
int curr_iblock;
|
|
bool is_compiling_class;
|
|
c11_vector /*T=Expr* */ s_expr;
|
|
c11_smallmap_n2i global_names;
|
|
c11_smallmap_s2n co_consts_string_dedup_map;
|
|
} Ctx;
|
|
|
|
typedef struct Expr Expr;
|
|
|
|
static void Ctx__ctor(Ctx* self, CodeObject* co, FuncDecl* func, int level);
|
|
static void Ctx__dtor(Ctx* self);
|
|
static int Ctx__get_loop(Ctx* self);
|
|
static CodeBlock* Ctx__enter_block(Ctx* self, CodeBlockType type);
|
|
static void Ctx__exit_block(Ctx* self);
|
|
static int Ctx__emit_(Ctx* self, Opcode opcode, uint16_t arg, int line);
|
|
static int Ctx__emit_virtual(Ctx* self, Opcode opcode, uint16_t arg, int line, bool virtual);
|
|
static void Ctx__revert_last_emit_(Ctx* self);
|
|
static int Ctx__emit_int(Ctx* self, int64_t value, int line);
|
|
static void Ctx__patch_jump(Ctx* self, int index);
|
|
static bool Ctx__add_label(Ctx* self, py_Name name);
|
|
static int Ctx__add_varname(Ctx* self, py_Name name);
|
|
static int Ctx__add_const(Ctx* self, py_Ref);
|
|
static int Ctx__add_const_string(Ctx* self, c11_sv);
|
|
static void Ctx__emit_store_name(Ctx* self, NameScope scope, py_Name name, int line);
|
|
static void Ctx__try_merge_for_iter_store(Ctx* self, int);
|
|
static void Ctx__s_emit_top(Ctx*); // emit top -> pop -> delete
|
|
static void Ctx__s_push(Ctx*, Expr*); // push
|
|
static Expr* Ctx__s_top(Ctx*); // top
|
|
static int Ctx__s_size(Ctx*); // size
|
|
static void Ctx__s_pop(Ctx*); // pop -> delete
|
|
static Expr* Ctx__s_popx(Ctx*); // pop move
|
|
static void Ctx__s_emit_decorators(Ctx*, int count);
|
|
|
|
/* expr.c */
|
|
typedef struct NameExpr {
|
|
EXPR_COMMON_HEADER
|
|
py_Name name;
|
|
NameScope scope;
|
|
} NameExpr;
|
|
|
|
void NameExpr__emit_(Expr* self_, Ctx* ctx) {
|
|
NameExpr* self = (NameExpr*)self_;
|
|
int index = c11_smallmap_n2i__get(&ctx->co->varnames_inv, self->name, -1);
|
|
if(self->scope == NAME_LOCAL && index >= 0) {
|
|
Ctx__emit_(ctx, OP_LOAD_FAST, index, self->line);
|
|
} else {
|
|
Opcode op = ctx->level <= 1 ? OP_LOAD_GLOBAL : OP_LOAD_NONLOCAL;
|
|
if(ctx->is_compiling_class && self->scope == NAME_GLOBAL) {
|
|
// if we are compiling a class, we should use OP_LOAD_ATTR_GLOBAL instead of
|
|
// OP_LOAD_GLOBAL this supports @property.setter
|
|
op = OP_LOAD_CLASS_GLOBAL;
|
|
// exec()/eval() won't work with OP_LOAD_ATTR_GLOBAL in class body
|
|
} else {
|
|
// we cannot determine the scope when calling exec()/eval()
|
|
if(self->scope == NAME_GLOBAL_UNKNOWN) op = OP_LOAD_NAME;
|
|
}
|
|
Ctx__emit_(ctx, op, self->name, self->line);
|
|
}
|
|
}
|
|
|
|
bool NameExpr__emit_del(Expr* self_, Ctx* ctx) {
|
|
NameExpr* self = (NameExpr*)self_;
|
|
switch(self->scope) {
|
|
case NAME_LOCAL:
|
|
Ctx__emit_(ctx, OP_DELETE_FAST, Ctx__add_varname(ctx, self->name), self->line);
|
|
break;
|
|
case NAME_GLOBAL: Ctx__emit_(ctx, OP_DELETE_GLOBAL, self->name, self->line); break;
|
|
case NAME_GLOBAL_UNKNOWN: Ctx__emit_(ctx, OP_DELETE_NAME, self->name, self->line); break;
|
|
default: c11__unreachedable();
|
|
}
|
|
return true;
|
|
}
|
|
|
|
bool NameExpr__emit_store(Expr* self_, Ctx* ctx) {
|
|
NameExpr* self = (NameExpr*)self_;
|
|
if(ctx->is_compiling_class) {
|
|
Ctx__emit_(ctx, OP_STORE_CLASS_ATTR, self->name, self->line);
|
|
return true;
|
|
}
|
|
Ctx__emit_store_name(ctx, self->scope, self->name, self->line);
|
|
return true;
|
|
}
|
|
|
|
NameExpr* NameExpr__new(int line, py_Name name, NameScope scope) {
|
|
const static ExprVt Vt = {.emit_ = NameExpr__emit_,
|
|
.emit_del = NameExpr__emit_del,
|
|
.emit_store = NameExpr__emit_store,
|
|
.is_name = true};
|
|
static_assert_expr_size(NameExpr);
|
|
NameExpr* self = PoolExpr_alloc();
|
|
self->vt = &Vt;
|
|
self->line = line;
|
|
self->name = name;
|
|
self->scope = scope;
|
|
return self;
|
|
}
|
|
|
|
typedef struct StarredExpr {
|
|
EXPR_COMMON_HEADER
|
|
Expr* child;
|
|
int level;
|
|
} StarredExpr;
|
|
|
|
void StarredExpr__emit_(Expr* self_, Ctx* ctx) {
|
|
StarredExpr* self = (StarredExpr*)self_;
|
|
vtemit_(self->child, ctx);
|
|
Ctx__emit_(ctx, OP_UNARY_STAR, self->level, self->line);
|
|
}
|
|
|
|
bool StarredExpr__emit_store(Expr* self_, Ctx* ctx) {
|
|
StarredExpr* self = (StarredExpr*)self_;
|
|
if(self->level != 1) return false;
|
|
// simply proxy to child
|
|
return vtemit_store(self->child, ctx);
|
|
}
|
|
|
|
StarredExpr* StarredExpr__new(int line, Expr* child, int level) {
|
|
const static ExprVt Vt = {.emit_ = StarredExpr__emit_,
|
|
.emit_store = StarredExpr__emit_store,
|
|
.is_starred = true};
|
|
static_assert_expr_size(StarredExpr);
|
|
StarredExpr* self = PoolExpr_alloc();
|
|
self->vt = &Vt;
|
|
self->line = line;
|
|
self->child = child;
|
|
self->level = level;
|
|
return self;
|
|
}
|
|
|
|
// InvertExpr, NotExpr, NegatedExpr
|
|
// NOTE: NegatedExpr always contains a non-const child. Should not generate -1 or -0.1
|
|
typedef struct UnaryExpr {
|
|
EXPR_COMMON_HEADER
|
|
Expr* child;
|
|
Opcode opcode;
|
|
} UnaryExpr;
|
|
|
|
void UnaryExpr__dtor(Expr* self_) {
|
|
UnaryExpr* self = (UnaryExpr*)self_;
|
|
vtdelete(self->child);
|
|
}
|
|
|
|
static void UnaryExpr__emit_(Expr* self_, Ctx* ctx) {
|
|
UnaryExpr* self = (UnaryExpr*)self_;
|
|
vtemit_(self->child, ctx);
|
|
Ctx__emit_(ctx, self->opcode, BC_NOARG, self->line);
|
|
}
|
|
|
|
UnaryExpr* UnaryExpr__new(int line, Expr* child, Opcode opcode) {
|
|
const static ExprVt Vt = {.emit_ = UnaryExpr__emit_, .dtor = UnaryExpr__dtor};
|
|
static_assert_expr_size(UnaryExpr);
|
|
UnaryExpr* self = PoolExpr_alloc();
|
|
self->vt = &Vt;
|
|
self->line = line;
|
|
self->child = child;
|
|
self->opcode = opcode;
|
|
return self;
|
|
}
|
|
|
|
typedef struct RawStringExpr {
|
|
EXPR_COMMON_HEADER
|
|
c11_sv value;
|
|
Opcode opcode;
|
|
} RawStringExpr;
|
|
|
|
void RawStringExpr__emit_(Expr* self_, Ctx* ctx) {
|
|
RawStringExpr* self = (RawStringExpr*)self_;
|
|
int index = Ctx__add_const_string(ctx, self->value);
|
|
Ctx__emit_(ctx, OP_LOAD_CONST, index, self->line);
|
|
Ctx__emit_(ctx, self->opcode, BC_NOARG, self->line);
|
|
}
|
|
|
|
RawStringExpr* RawStringExpr__new(int line, c11_sv value, Opcode opcode) {
|
|
const static ExprVt Vt = {.emit_ = RawStringExpr__emit_};
|
|
static_assert_expr_size(RawStringExpr);
|
|
RawStringExpr* self = PoolExpr_alloc();
|
|
self->vt = &Vt;
|
|
self->line = line;
|
|
self->value = value;
|
|
self->opcode = opcode;
|
|
return self;
|
|
}
|
|
|
|
typedef struct ImagExpr {
|
|
EXPR_COMMON_HEADER
|
|
double value;
|
|
} ImagExpr;
|
|
|
|
void ImagExpr__emit_(Expr* self_, Ctx* ctx) {
|
|
ImagExpr* self = (ImagExpr*)self_;
|
|
py_TValue value;
|
|
py_newfloat(&value, self->value);
|
|
int index = Ctx__add_const(ctx, &value);
|
|
Ctx__emit_(ctx, OP_LOAD_CONST, index, self->line);
|
|
Ctx__emit_(ctx, OP_BUILD_IMAG, BC_NOARG, self->line);
|
|
}
|
|
|
|
ImagExpr* ImagExpr__new(int line, double value) {
|
|
const static ExprVt Vt = {.emit_ = ImagExpr__emit_};
|
|
static_assert_expr_size(ImagExpr);
|
|
ImagExpr* self = PoolExpr_alloc();
|
|
self->vt = &Vt;
|
|
self->line = line;
|
|
self->value = value;
|
|
return self;
|
|
}
|
|
|
|
typedef struct LiteralExpr {
|
|
EXPR_COMMON_HEADER
|
|
const TokenValue* value;
|
|
} LiteralExpr;
|
|
|
|
void LiteralExpr__emit_(Expr* self_, Ctx* ctx) {
|
|
LiteralExpr* self = (LiteralExpr*)self_;
|
|
switch(self->value->index) {
|
|
case TokenValue_I64: {
|
|
int64_t val = self->value->_i64;
|
|
Ctx__emit_int(ctx, val, self->line);
|
|
break;
|
|
}
|
|
case TokenValue_F64: {
|
|
py_TValue value;
|
|
py_newfloat(&value, self->value->_f64);
|
|
int index = Ctx__add_const(ctx, &value);
|
|
Ctx__emit_(ctx, OP_LOAD_CONST, index, self->line);
|
|
break;
|
|
}
|
|
case TokenValue_STR: {
|
|
c11_sv sv = c11_string__sv(self->value->_str);
|
|
int index = Ctx__add_const_string(ctx, sv);
|
|
Ctx__emit_(ctx, OP_LOAD_CONST, index, self->line);
|
|
break;
|
|
}
|
|
default: c11__unreachedable();
|
|
}
|
|
}
|
|
|
|
LiteralExpr* LiteralExpr__new(int line, const TokenValue* value) {
|
|
const static ExprVt Vt = {.emit_ = LiteralExpr__emit_,
|
|
.is_literal = true,
|
|
.is_json_object = true};
|
|
static_assert_expr_size(LiteralExpr);
|
|
LiteralExpr* self = PoolExpr_alloc();
|
|
self->vt = &Vt;
|
|
self->line = line;
|
|
self->value = value;
|
|
return self;
|
|
}
|
|
|
|
typedef struct Literal0Expr {
|
|
EXPR_COMMON_HEADER
|
|
TokenIndex token;
|
|
} Literal0Expr;
|
|
|
|
void Literal0Expr__emit_(Expr* self_, Ctx* ctx) {
|
|
Literal0Expr* self = (Literal0Expr*)self_;
|
|
Opcode opcode;
|
|
switch(self->token) {
|
|
case TK_NONE: opcode = OP_LOAD_NONE; break;
|
|
case TK_TRUE: opcode = OP_LOAD_TRUE; break;
|
|
case TK_FALSE: opcode = OP_LOAD_FALSE; break;
|
|
case TK_DOTDOTDOT: opcode = OP_LOAD_ELLIPSIS; break;
|
|
default: assert(false);
|
|
}
|
|
Ctx__emit_(ctx, opcode, BC_NOARG, self->line);
|
|
}
|
|
|
|
Literal0Expr* Literal0Expr__new(int line, TokenIndex token) {
|
|
const static ExprVt Vt = {.emit_ = Literal0Expr__emit_,
|
|
.is_literal = true,
|
|
.is_json_object = true};
|
|
static_assert_expr_size(Literal0Expr);
|
|
Literal0Expr* self = PoolExpr_alloc();
|
|
self->vt = &Vt;
|
|
self->line = line;
|
|
self->token = token;
|
|
return self;
|
|
}
|
|
|
|
typedef struct SliceExpr {
|
|
EXPR_COMMON_HEADER
|
|
Expr* start;
|
|
Expr* stop;
|
|
Expr* step;
|
|
} SliceExpr;
|
|
|
|
void SliceExpr__dtor(Expr* self_) {
|
|
SliceExpr* self = (SliceExpr*)self_;
|
|
vtdelete(self->start);
|
|
vtdelete(self->stop);
|
|
vtdelete(self->step);
|
|
}
|
|
|
|
void SliceExpr__emit_(Expr* self_, Ctx* ctx) {
|
|
SliceExpr* self = (SliceExpr*)self_;
|
|
if(self->start)
|
|
vtemit_(self->start, ctx);
|
|
else
|
|
Ctx__emit_(ctx, OP_LOAD_NONE, BC_NOARG, self->line);
|
|
if(self->stop)
|
|
vtemit_(self->stop, ctx);
|
|
else
|
|
Ctx__emit_(ctx, OP_LOAD_NONE, BC_NOARG, self->line);
|
|
if(self->step)
|
|
vtemit_(self->step, ctx);
|
|
else
|
|
Ctx__emit_(ctx, OP_LOAD_NONE, BC_NOARG, self->line);
|
|
Ctx__emit_(ctx, OP_BUILD_SLICE, BC_NOARG, self->line);
|
|
}
|
|
|
|
SliceExpr* SliceExpr__new(int line) {
|
|
const static ExprVt Vt = {.dtor = SliceExpr__dtor, .emit_ = SliceExpr__emit_};
|
|
static_assert_expr_size(SliceExpr);
|
|
SliceExpr* self = PoolExpr_alloc();
|
|
self->vt = &Vt;
|
|
self->line = line;
|
|
self->start = NULL;
|
|
self->stop = NULL;
|
|
self->step = NULL;
|
|
return self;
|
|
}
|
|
|
|
// ListExpr, DictExpr, SetExpr, TupleExpr
|
|
typedef struct SequenceExpr {
|
|
EXPR_COMMON_HEADER
|
|
c11_array /*T=Expr* */ items;
|
|
Opcode opcode;
|
|
} SequenceExpr;
|
|
|
|
static void SequenceExpr__emit_(Expr* self_, Ctx* ctx) {
|
|
SequenceExpr* self = (SequenceExpr*)self_;
|
|
for(int i = 0; i < self->items.count; i++) {
|
|
Expr* item = c11__getitem(Expr*, &self->items, i);
|
|
vtemit_(item, ctx);
|
|
}
|
|
Ctx__emit_(ctx, self->opcode, self->items.count, self->line);
|
|
}
|
|
|
|
void SequenceExpr__dtor(Expr* self_) {
|
|
SequenceExpr* self = (SequenceExpr*)self_;
|
|
c11__foreach(Expr*, &self->items, e) vtdelete(*e);
|
|
c11_array__dtor(&self->items);
|
|
}
|
|
|
|
bool TupleExpr__emit_store(Expr* self_, Ctx* ctx) {
|
|
SequenceExpr* self = (SequenceExpr*)self_;
|
|
// TOS is an iterable
|
|
// items may contain StarredExpr, we should check it
|
|
int starred_i = -1;
|
|
for(int i = 0; i < self->items.count; i++) {
|
|
Expr* e = c11__getitem(Expr*, &self->items, i);
|
|
if(e->vt->is_starred) {
|
|
if(((StarredExpr*)e)->level > 0) {
|
|
if(starred_i == -1)
|
|
starred_i = i;
|
|
else
|
|
return false; // multiple StarredExpr not allowed
|
|
}
|
|
}
|
|
}
|
|
|
|
if(starred_i == -1) {
|
|
Bytecode* prev = c11__at(Bytecode, &ctx->co->codes, ctx->co->codes.count - 1);
|
|
if(prev->op == OP_BUILD_TUPLE && prev->arg == self->items.count) {
|
|
// build tuple and unpack it is meaningless
|
|
Ctx__revert_last_emit_(ctx);
|
|
} else {
|
|
if(prev->op == OP_FOR_ITER) {
|
|
prev->op = OP_FOR_ITER_UNPACK;
|
|
prev->arg = self->items.count;
|
|
} else {
|
|
Ctx__emit_(ctx, OP_UNPACK_SEQUENCE, self->items.count, self->line);
|
|
}
|
|
}
|
|
} else {
|
|
// starred assignment target must be in a tuple
|
|
if(self->items.count == 1) return false;
|
|
// starred assignment target must be the last one (differ from cpython)
|
|
if(starred_i != self->items.count - 1) return false;
|
|
// a,*b = [1,2,3]
|
|
// stack is [1,2,3] -> [1,[2,3]]
|
|
Ctx__emit_(ctx, OP_UNPACK_EX, self->items.count - 1, self->line);
|
|
}
|
|
// do reverse emit
|
|
for(int i = self->items.count - 1; i >= 0; i--) {
|
|
Expr* e = c11__getitem(Expr*, &self->items, i);
|
|
bool ok = vtemit_store(e, ctx);
|
|
if(!ok) return false;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
bool TupleExpr__emit_del(Expr* self_, Ctx* ctx) {
|
|
SequenceExpr* self = (SequenceExpr*)self_;
|
|
c11__foreach(Expr*, &self->items, e) {
|
|
bool ok = vtemit_del(*e, ctx);
|
|
if(!ok) return false;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
static SequenceExpr* SequenceExpr__new(int line, const ExprVt* vt, int count, Opcode opcode) {
|
|
static_assert_expr_size(SequenceExpr);
|
|
SequenceExpr* self = PoolExpr_alloc();
|
|
self->vt = vt;
|
|
self->line = line;
|
|
self->opcode = opcode;
|
|
c11_array__ctor(&self->items, sizeof(Expr*), count);
|
|
return self;
|
|
}
|
|
|
|
SequenceExpr* ListExpr__new(int line, int count) {
|
|
const static ExprVt ListExprVt = {.dtor = SequenceExpr__dtor,
|
|
.emit_ = SequenceExpr__emit_,
|
|
.is_json_object = true};
|
|
return SequenceExpr__new(line, &ListExprVt, count, OP_BUILD_LIST);
|
|
}
|
|
|
|
SequenceExpr* DictExpr__new(int line, int count) {
|
|
const static ExprVt DictExprVt = {.dtor = SequenceExpr__dtor,
|
|
.emit_ = SequenceExpr__emit_,
|
|
.is_json_object = true};
|
|
return SequenceExpr__new(line, &DictExprVt, count, OP_BUILD_DICT);
|
|
}
|
|
|
|
SequenceExpr* SetExpr__new(int line, int count) {
|
|
const static ExprVt SetExprVt = {
|
|
.dtor = SequenceExpr__dtor,
|
|
.emit_ = SequenceExpr__emit_,
|
|
};
|
|
return SequenceExpr__new(line, &SetExprVt, count, OP_BUILD_SET);
|
|
}
|
|
|
|
SequenceExpr* TupleExpr__new(int line, int count) {
|
|
const static ExprVt TupleExprVt = {.dtor = SequenceExpr__dtor,
|
|
.emit_ = SequenceExpr__emit_,
|
|
.is_tuple = true,
|
|
.emit_store = TupleExpr__emit_store,
|
|
.emit_del = TupleExpr__emit_del};
|
|
return SequenceExpr__new(line, &TupleExprVt, count, OP_BUILD_TUPLE);
|
|
}
|
|
|
|
typedef struct CompExpr {
|
|
EXPR_COMMON_HEADER
|
|
Expr* expr; // loop expr
|
|
Expr* vars; // loop vars
|
|
Expr* iter; // loop iter
|
|
Expr* cond; // optional if condition
|
|
|
|
Opcode op0;
|
|
Opcode op1;
|
|
} CompExpr;
|
|
|
|
void CompExpr__dtor(Expr* self_) {
|
|
CompExpr* self = (CompExpr*)self_;
|
|
vtdelete(self->expr);
|
|
vtdelete(self->vars);
|
|
vtdelete(self->iter);
|
|
vtdelete(self->cond);
|
|
}
|
|
|
|
void CompExpr__emit_(Expr* self_, Ctx* ctx) {
|
|
CompExpr* self = (CompExpr*)self_;
|
|
Ctx__emit_(ctx, self->op0, 0, self->line);
|
|
vtemit_(self->iter, ctx);
|
|
Ctx__emit_(ctx, OP_GET_ITER, BC_NOARG, BC_KEEPLINE);
|
|
Ctx__enter_block(ctx, CodeBlockType_FOR_LOOP);
|
|
int curr_iblock = ctx->curr_iblock;
|
|
int for_codei = Ctx__emit_(ctx, OP_FOR_ITER, curr_iblock, BC_KEEPLINE);
|
|
bool ok = vtemit_store(self->vars, ctx);
|
|
// this error occurs in `vars` instead of this line, but...nevermind
|
|
assert(ok); // this should raise a SyntaxError, but we just assert it
|
|
Ctx__try_merge_for_iter_store(ctx, for_codei);
|
|
if(self->cond) {
|
|
vtemit_(self->cond, ctx);
|
|
int patch = Ctx__emit_(ctx, OP_POP_JUMP_IF_FALSE, BC_NOARG, BC_KEEPLINE);
|
|
vtemit_(self->expr, ctx);
|
|
Ctx__emit_(ctx, self->op1, BC_NOARG, BC_KEEPLINE);
|
|
Ctx__patch_jump(ctx, patch);
|
|
} else {
|
|
vtemit_(self->expr, ctx);
|
|
Ctx__emit_(ctx, self->op1, BC_NOARG, BC_KEEPLINE);
|
|
}
|
|
Ctx__emit_(ctx, OP_LOOP_CONTINUE, curr_iblock, BC_KEEPLINE);
|
|
Ctx__exit_block(ctx);
|
|
}
|
|
|
|
CompExpr* CompExpr__new(int line, Opcode op0, Opcode op1) {
|
|
const static ExprVt Vt = {.dtor = CompExpr__dtor, .emit_ = CompExpr__emit_};
|
|
static_assert_expr_size(CompExpr);
|
|
CompExpr* self = PoolExpr_alloc();
|
|
self->vt = &Vt;
|
|
self->line = line;
|
|
self->op0 = op0;
|
|
self->op1 = op1;
|
|
self->expr = NULL;
|
|
self->vars = NULL;
|
|
self->iter = NULL;
|
|
self->cond = NULL;
|
|
return self;
|
|
}
|
|
|
|
typedef struct LambdaExpr {
|
|
EXPR_COMMON_HEADER
|
|
int index;
|
|
} LambdaExpr;
|
|
|
|
static void LambdaExpr__emit_(Expr* self_, Ctx* ctx) {
|
|
LambdaExpr* self = (LambdaExpr*)self_;
|
|
Ctx__emit_(ctx, OP_LOAD_FUNCTION, self->index, self->line);
|
|
}
|
|
|
|
LambdaExpr* LambdaExpr__new(int line, int index) {
|
|
const static ExprVt Vt = {.emit_ = LambdaExpr__emit_};
|
|
static_assert_expr_size(LambdaExpr);
|
|
LambdaExpr* self = PoolExpr_alloc();
|
|
self->vt = &Vt;
|
|
self->line = line;
|
|
self->index = index;
|
|
return self;
|
|
}
|
|
|
|
typedef struct FStringExpr {
|
|
EXPR_COMMON_HEADER
|
|
c11_sv src;
|
|
} FStringExpr;
|
|
|
|
static bool is_fmt_valid_char(char c) {
|
|
switch(c) {
|
|
// clang-format off
|
|
case '-': case '=': case '*': case '#': case '@': case '!': case '~':
|
|
case '<': case '>': case '^':
|
|
case '.': case 'f': case 'd': case 's':
|
|
case '0': case '1': case '2': case '3': case '4': case '5': case '6': case '7': case '8': case '9':
|
|
return true;
|
|
default: return false;
|
|
// clang-format on
|
|
}
|
|
}
|
|
|
|
static bool is_identifier(c11_sv s) {
|
|
if(s.size == 0) return false;
|
|
if(!isalpha(s.data[0]) && s.data[0] != '_') return false;
|
|
for(int i = 0; i < s.size; i++) {
|
|
char c = s.data[i];
|
|
if(!isalnum(c) && c != '_') return false;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
static void _load_simple_expr(Ctx* ctx, c11_sv expr, int line) {
|
|
bool repr = false;
|
|
const char* expr_end = expr.data + expr.size;
|
|
if(expr.size >= 2 && expr_end[-2] == '!') {
|
|
switch(expr_end[-1]) {
|
|
case 'r':
|
|
repr = true;
|
|
expr.size -= 2; // expr[:-2]
|
|
break;
|
|
case 's':
|
|
repr = false;
|
|
expr.size -= 2; // expr[:-2]
|
|
break;
|
|
default: break; // nothing happens
|
|
}
|
|
}
|
|
// name or name.name
|
|
bool is_fastpath = false;
|
|
if(is_identifier(expr)) {
|
|
// ctx->emit_(OP_LOAD_NAME, py_Name(expr.sv()).index, line);
|
|
Ctx__emit_(ctx, OP_LOAD_NAME, py_name2(expr), line);
|
|
is_fastpath = true;
|
|
} else {
|
|
int dot = c11_sv__index(expr, '.');
|
|
if(dot > 0) {
|
|
c11_sv a = {expr.data, dot}; // expr[:dot]
|
|
c11_sv b = {expr.data + (dot + 1), expr.size - (dot + 1)}; // expr[dot+1:]
|
|
if(is_identifier(a) && is_identifier(b)) {
|
|
Ctx__emit_(ctx, OP_LOAD_NAME, py_name2(a), line);
|
|
Ctx__emit_(ctx, OP_LOAD_ATTR, py_name2(b), line);
|
|
is_fastpath = true;
|
|
}
|
|
}
|
|
}
|
|
|
|
if(!is_fastpath) {
|
|
int index = Ctx__add_const_string(ctx, expr);
|
|
Ctx__emit_(ctx, OP_FSTRING_EVAL, index, line);
|
|
}
|
|
|
|
if(repr) { Ctx__emit_(ctx, OP_REPR, BC_NOARG, line); }
|
|
}
|
|
|
|
static void FStringExpr__emit_(Expr* self_, Ctx* ctx) {
|
|
FStringExpr* self = (FStringExpr*)self_;
|
|
int i = 0; // left index
|
|
int j = 0; // right index
|
|
int count = 0; // how many string parts
|
|
bool flag = false; // true if we are in a expression
|
|
|
|
const char* src = self->src.data;
|
|
while(j < self->src.size) {
|
|
if(flag) {
|
|
if(src[j] == '}') {
|
|
// add expression
|
|
c11_sv expr = {src + i, j - i}; // src[i:j]
|
|
// BUG: ':' is not a format specifier in f"{stack[2:]}"
|
|
int conon = c11_sv__index(expr, ':');
|
|
if(conon >= 0) {
|
|
c11_sv spec = {expr.data + (conon + 1),
|
|
expr.size - (conon + 1)}; // expr[conon+1:]
|
|
// filter some invalid spec
|
|
bool ok = true;
|
|
for(int k = 0; k < spec.size; k++) {
|
|
char c = spec.data[k];
|
|
if(!is_fmt_valid_char(c)) {
|
|
ok = false;
|
|
break;
|
|
}
|
|
}
|
|
if(ok) {
|
|
expr.size = conon; // expr[:conon]
|
|
_load_simple_expr(ctx, expr, self->line);
|
|
// ctx->emit_(OP_FORMAT_STRING, ctx->add_const_string(spec.sv()), line);
|
|
Ctx__emit_(ctx,
|
|
OP_FORMAT_STRING,
|
|
Ctx__add_const_string(ctx, spec),
|
|
self->line);
|
|
} else {
|
|
// ':' is not a spec indicator
|
|
_load_simple_expr(ctx, expr, self->line);
|
|
}
|
|
} else {
|
|
_load_simple_expr(ctx, expr, self->line);
|
|
}
|
|
flag = false;
|
|
count++;
|
|
}
|
|
} else {
|
|
if(src[j] == '{') {
|
|
// look at next char
|
|
if(j + 1 < self->src.size && src[j + 1] == '{') {
|
|
// {{ -> {
|
|
j++;
|
|
Ctx__emit_(ctx,
|
|
OP_LOAD_CONST,
|
|
Ctx__add_const_string(ctx, (c11_sv){"{", 1}),
|
|
self->line);
|
|
count++;
|
|
} else {
|
|
// { -> }
|
|
flag = true;
|
|
i = j + 1;
|
|
}
|
|
} else if(src[j] == '}') {
|
|
// look at next char
|
|
if(j + 1 < self->src.size && src[j + 1] == '}') {
|
|
// }} -> }
|
|
j++;
|
|
Ctx__emit_(ctx,
|
|
OP_LOAD_CONST,
|
|
Ctx__add_const_string(ctx, (c11_sv){"}", 1}),
|
|
self->line);
|
|
count++;
|
|
} else {
|
|
// } -> error
|
|
// throw std::runtime_error("f-string: unexpected }");
|
|
// just ignore
|
|
}
|
|
} else {
|
|
// literal
|
|
i = j;
|
|
while(j < self->src.size && src[j] != '{' && src[j] != '}')
|
|
j++;
|
|
c11_sv literal = {src + i, j - i}; // src[i:j]
|
|
Ctx__emit_(ctx, OP_LOAD_CONST, Ctx__add_const_string(ctx, literal), self->line);
|
|
count++;
|
|
continue; // skip j++
|
|
}
|
|
}
|
|
j++;
|
|
}
|
|
|
|
if(flag) {
|
|
// literal
|
|
c11_sv literal = {src + i, self->src.size - i}; // src[i:]
|
|
Ctx__emit_(ctx, OP_LOAD_CONST, Ctx__add_const_string(ctx, literal), self->line);
|
|
count++;
|
|
}
|
|
Ctx__emit_(ctx, OP_BUILD_STRING, count, self->line);
|
|
}
|
|
|
|
FStringExpr* FStringExpr__new(int line, c11_sv src) {
|
|
const static ExprVt Vt = {.emit_ = FStringExpr__emit_};
|
|
static_assert_expr_size(FStringExpr);
|
|
FStringExpr* self = PoolExpr_alloc();
|
|
self->vt = &Vt;
|
|
self->line = line;
|
|
self->src = src;
|
|
return self;
|
|
}
|
|
|
|
// AndExpr, OrExpr
|
|
typedef struct LogicBinaryExpr {
|
|
EXPR_COMMON_HEADER
|
|
Expr* lhs;
|
|
Expr* rhs;
|
|
Opcode opcode;
|
|
} LogicBinaryExpr;
|
|
|
|
void LogicBinaryExpr__dtor(Expr* self_) {
|
|
LogicBinaryExpr* self = (LogicBinaryExpr*)self_;
|
|
vtdelete(self->lhs);
|
|
vtdelete(self->rhs);
|
|
}
|
|
|
|
void LogicBinaryExpr__emit_(Expr* self_, Ctx* ctx) {
|
|
LogicBinaryExpr* self = (LogicBinaryExpr*)self_;
|
|
vtemit_(self->lhs, ctx);
|
|
int patch = Ctx__emit_(ctx, self->opcode, BC_NOARG, self->line);
|
|
vtemit_(self->rhs, ctx);
|
|
Ctx__patch_jump(ctx, patch);
|
|
}
|
|
|
|
LogicBinaryExpr* LogicBinaryExpr__new(int line, Opcode opcode) {
|
|
const static ExprVt Vt = {.emit_ = LogicBinaryExpr__emit_, .dtor = LogicBinaryExpr__dtor};
|
|
static_assert_expr_size(LogicBinaryExpr);
|
|
LogicBinaryExpr* self = PoolExpr_alloc();
|
|
self->vt = &Vt;
|
|
self->line = line;
|
|
self->lhs = NULL;
|
|
self->rhs = NULL;
|
|
self->opcode = opcode;
|
|
return self;
|
|
}
|
|
|
|
typedef struct GroupedExpr {
|
|
EXPR_COMMON_HEADER
|
|
Expr* child;
|
|
} GroupedExpr;
|
|
|
|
void GroupedExpr__dtor(Expr* self_) {
|
|
GroupedExpr* self = (GroupedExpr*)self_;
|
|
vtdelete(self->child);
|
|
}
|
|
|
|
void GroupedExpr__emit_(Expr* self_, Ctx* ctx) {
|
|
GroupedExpr* self = (GroupedExpr*)self_;
|
|
vtemit_(self->child, ctx);
|
|
}
|
|
|
|
bool GroupedExpr__emit_del(Expr* self_, Ctx* ctx) {
|
|
GroupedExpr* self = (GroupedExpr*)self_;
|
|
return vtemit_del(self->child, ctx);
|
|
}
|
|
|
|
bool GroupedExpr__emit_store(Expr* self_, Ctx* ctx) {
|
|
GroupedExpr* self = (GroupedExpr*)self_;
|
|
return vtemit_store(self->child, ctx);
|
|
}
|
|
|
|
GroupedExpr* GroupedExpr__new(int line, Expr* child) {
|
|
const static ExprVt Vt = {.dtor = GroupedExpr__dtor,
|
|
.emit_ = GroupedExpr__emit_,
|
|
.emit_del = GroupedExpr__emit_del,
|
|
.emit_store = GroupedExpr__emit_store};
|
|
static_assert_expr_size(GroupedExpr);
|
|
GroupedExpr* self = PoolExpr_alloc();
|
|
self->vt = &Vt;
|
|
self->line = line;
|
|
self->child = child;
|
|
return self;
|
|
}
|
|
|
|
typedef struct BinaryExpr {
|
|
EXPR_COMMON_HEADER
|
|
Expr* lhs;
|
|
Expr* rhs;
|
|
TokenIndex op;
|
|
bool inplace;
|
|
} BinaryExpr;
|
|
|
|
static void BinaryExpr__dtor(Expr* self_) {
|
|
BinaryExpr* self = (BinaryExpr*)self_;
|
|
vtdelete(self->lhs);
|
|
vtdelete(self->rhs);
|
|
}
|
|
|
|
static py_Name cmp_token2name(TokenIndex token) {
|
|
switch(token) {
|
|
case TK_LT: return __lt__;
|
|
case TK_LE: return __le__;
|
|
case TK_EQ: return __eq__;
|
|
case TK_NE: return __ne__;
|
|
case TK_GT: return __gt__;
|
|
case TK_GE: return __ge__;
|
|
default: return 0;
|
|
}
|
|
}
|
|
|
|
#define is_compare_expr(e) ((e)->vt->is_binary && cmp_token2name(((BinaryExpr*)(e))->op))
|
|
|
|
static void _emit_compare(BinaryExpr* self, Ctx* ctx, c11_vector* jmps) {
|
|
if(is_compare_expr(self->lhs)) {
|
|
_emit_compare((BinaryExpr*)self->lhs, ctx, jmps);
|
|
} else {
|
|
vtemit_(self->lhs, ctx); // [a]
|
|
}
|
|
vtemit_(self->rhs, ctx); // [a, b]
|
|
Ctx__emit_(ctx, OP_DUP_TOP, BC_NOARG, self->line); // [a, b, b]
|
|
Ctx__emit_(ctx, OP_ROT_THREE, BC_NOARG, self->line); // [b, a, b]
|
|
Ctx__emit_(ctx, OP_BINARY_OP, cmp_token2name(self->op), self->line);
|
|
// [b, RES]
|
|
int index = Ctx__emit_(ctx, OP_JUMP_IF_FALSE_OR_POP, BC_NOARG, self->line);
|
|
c11_vector__push(int, jmps, index);
|
|
}
|
|
|
|
static void BinaryExpr__emit_(Expr* self_, Ctx* ctx) {
|
|
BinaryExpr* self = (BinaryExpr*)self_;
|
|
c11_vector /*T=int*/ jmps;
|
|
c11_vector__ctor(&jmps, sizeof(int));
|
|
if(cmp_token2name(self->op) && is_compare_expr(self->lhs)) {
|
|
// (a < b) < c
|
|
BinaryExpr* e = (BinaryExpr*)self->lhs;
|
|
_emit_compare(e, ctx, &jmps);
|
|
// [b, RES]
|
|
} else {
|
|
// (1 + 2) < c
|
|
if(self->inplace) {
|
|
vtemit_inplace(self->lhs, ctx);
|
|
} else {
|
|
vtemit_(self->lhs, ctx);
|
|
}
|
|
}
|
|
|
|
vtemit_(self->rhs, ctx);
|
|
|
|
Opcode opcode = OP_BINARY_OP;
|
|
uint16_t arg = BC_NOARG;
|
|
|
|
switch(self->op) {
|
|
case TK_ADD: arg = __add__ | (__radd__ << 8); break;
|
|
case TK_SUB: arg = __sub__ | (__rsub__ << 8); break;
|
|
case TK_MUL: arg = __mul__ | (__rmul__ << 8); break;
|
|
case TK_DIV: arg = __truediv__ | (__rtruediv__ << 8); break;
|
|
case TK_FLOORDIV: arg = __floordiv__ | (__rfloordiv__ << 8); break;
|
|
case TK_MOD: arg = __mod__ | (__rmod__ << 8); break;
|
|
case TK_POW: arg = __pow__ | (__rpow__ << 8); break;
|
|
|
|
case TK_LT: arg = __lt__ | (__gt__ << 8); break;
|
|
case TK_LE: arg = __le__ | (__ge__ << 8); break;
|
|
case TK_EQ: arg = __eq__ | (__eq__ << 8); break;
|
|
case TK_NE: arg = __ne__ | (__ne__ << 8); break;
|
|
case TK_GT: arg = __gt__ | (__lt__ << 8); break;
|
|
case TK_GE: arg = __ge__ | (__le__ << 8); break;
|
|
|
|
case TK_IN:
|
|
opcode = OP_CONTAINS_OP;
|
|
arg = 0;
|
|
break;
|
|
case TK_NOT_IN:
|
|
opcode = OP_CONTAINS_OP;
|
|
arg = 1;
|
|
break;
|
|
case TK_IS:
|
|
opcode = OP_IS_OP;
|
|
arg = 0;
|
|
break;
|
|
case TK_IS_NOT:
|
|
opcode = OP_IS_OP;
|
|
arg = 1;
|
|
break;
|
|
|
|
case TK_LSHIFT: arg = __lshift__; break;
|
|
case TK_RSHIFT: arg = __rshift__; break;
|
|
case TK_AND: arg = __and__; break;
|
|
case TK_OR: arg = __or__; break;
|
|
case TK_XOR: arg = __xor__; break;
|
|
case TK_DECORATOR: arg = __matmul__; break;
|
|
default: assert(false);
|
|
}
|
|
|
|
Ctx__emit_(ctx, opcode, arg, self->line);
|
|
|
|
for(int i = 0; i < jmps.count; i++) {
|
|
Ctx__patch_jump(ctx, c11__getitem(int, &jmps, i));
|
|
}
|
|
}
|
|
|
|
BinaryExpr* BinaryExpr__new(int line, TokenIndex op, bool inplace) {
|
|
const static ExprVt Vt = {.emit_ = BinaryExpr__emit_, .dtor = BinaryExpr__dtor};
|
|
static_assert_expr_size(BinaryExpr);
|
|
BinaryExpr* self = PoolExpr_alloc();
|
|
self->vt = &Vt;
|
|
self->line = line;
|
|
self->lhs = NULL;
|
|
self->rhs = NULL;
|
|
self->op = op;
|
|
self->inplace = inplace;
|
|
return self;
|
|
}
|
|
|
|
typedef struct TernaryExpr {
|
|
EXPR_COMMON_HEADER
|
|
Expr* cond;
|
|
Expr* true_expr;
|
|
Expr* false_expr;
|
|
} TernaryExpr;
|
|
|
|
void TernaryExpr__dtor(Expr* self_) {
|
|
TernaryExpr* self = (TernaryExpr*)self_;
|
|
vtdelete(self->cond);
|
|
vtdelete(self->true_expr);
|
|
vtdelete(self->false_expr);
|
|
}
|
|
|
|
void TernaryExpr__emit_(Expr* self_, Ctx* ctx) {
|
|
TernaryExpr* self = (TernaryExpr*)self_;
|
|
vtemit_(self->cond, ctx);
|
|
int patch = Ctx__emit_(ctx, OP_POP_JUMP_IF_FALSE, BC_NOARG, self->cond->line);
|
|
vtemit_(self->true_expr, ctx);
|
|
int patch_2 = Ctx__emit_(ctx, OP_JUMP_FORWARD, BC_NOARG, self->true_expr->line);
|
|
Ctx__patch_jump(ctx, patch);
|
|
vtemit_(self->false_expr, ctx);
|
|
Ctx__patch_jump(ctx, patch_2);
|
|
}
|
|
|
|
TernaryExpr* TernaryExpr__new(int line) {
|
|
const static ExprVt Vt = {.dtor = TernaryExpr__dtor, .emit_ = TernaryExpr__emit_};
|
|
static_assert_expr_size(TernaryExpr);
|
|
TernaryExpr* self = PoolExpr_alloc();
|
|
self->vt = &Vt;
|
|
self->line = line;
|
|
self->cond = NULL;
|
|
self->true_expr = NULL;
|
|
self->false_expr = NULL;
|
|
return self;
|
|
}
|
|
|
|
typedef struct SubscrExpr {
|
|
EXPR_COMMON_HEADER
|
|
Expr* lhs;
|
|
Expr* rhs;
|
|
} SubscrExpr;
|
|
|
|
void SubscrExpr__dtor(Expr* self_) {
|
|
SubscrExpr* self = (SubscrExpr*)self_;
|
|
vtdelete(self->lhs);
|
|
vtdelete(self->rhs);
|
|
}
|
|
|
|
void SubscrExpr__emit_(Expr* self_, Ctx* ctx) {
|
|
SubscrExpr* self = (SubscrExpr*)self_;
|
|
vtemit_(self->lhs, ctx);
|
|
vtemit_(self->rhs, ctx);
|
|
Ctx__emit_(ctx, OP_LOAD_SUBSCR, BC_NOARG, self->line);
|
|
}
|
|
|
|
bool SubscrExpr__emit_store(Expr* self_, Ctx* ctx) {
|
|
SubscrExpr* self = (SubscrExpr*)self_;
|
|
vtemit_(self->lhs, ctx);
|
|
vtemit_(self->rhs, ctx);
|
|
Ctx__emit_(ctx, OP_STORE_SUBSCR, BC_NOARG, self->line);
|
|
return true;
|
|
}
|
|
|
|
void SubscrExpr__emit_inplace(Expr* self_, Ctx* ctx) {
|
|
SubscrExpr* self = (SubscrExpr*)self_;
|
|
vtemit_(self->lhs, ctx);
|
|
vtemit_(self->rhs, ctx);
|
|
Ctx__emit_(ctx, OP_DUP_TOP_TWO, BC_NOARG, self->line);
|
|
Ctx__emit_(ctx, OP_LOAD_SUBSCR, BC_NOARG, self->line);
|
|
}
|
|
|
|
bool SubscrExpr__emit_istore(Expr* self_, Ctx* ctx) {
|
|
SubscrExpr* self = (SubscrExpr*)self_;
|
|
// [a, b, val] -> [val, a, b]
|
|
Ctx__emit_(ctx, OP_ROT_THREE, BC_NOARG, self->line);
|
|
Ctx__emit_(ctx, OP_STORE_SUBSCR, BC_NOARG, self->line);
|
|
return true;
|
|
}
|
|
|
|
bool SubscrExpr__emit_del(Expr* self_, Ctx* ctx) {
|
|
SubscrExpr* self = (SubscrExpr*)self_;
|
|
vtemit_(self->lhs, ctx);
|
|
vtemit_(self->rhs, ctx);
|
|
Ctx__emit_(ctx, OP_DELETE_SUBSCR, BC_NOARG, self->line);
|
|
return true;
|
|
}
|
|
|
|
SubscrExpr* SubscrExpr__new(int line) {
|
|
const static ExprVt Vt = {
|
|
.dtor = SubscrExpr__dtor,
|
|
.emit_ = SubscrExpr__emit_,
|
|
.emit_store = SubscrExpr__emit_store,
|
|
.emit_inplace = SubscrExpr__emit_inplace,
|
|
.emit_istore = SubscrExpr__emit_istore,
|
|
.emit_del = SubscrExpr__emit_del,
|
|
.is_subscr = true,
|
|
};
|
|
static_assert_expr_size(SubscrExpr);
|
|
SubscrExpr* self = PoolExpr_alloc();
|
|
self->vt = &Vt;
|
|
self->line = line;
|
|
self->lhs = NULL;
|
|
self->rhs = NULL;
|
|
return self;
|
|
}
|
|
|
|
typedef struct AttribExpr {
|
|
EXPR_COMMON_HEADER
|
|
Expr* child;
|
|
py_Name name;
|
|
} AttribExpr;
|
|
|
|
void AttribExpr__dtor(Expr* self_) {
|
|
AttribExpr* self = (AttribExpr*)self_;
|
|
vtdelete(self->child);
|
|
}
|
|
|
|
void AttribExpr__emit_(Expr* self_, Ctx* ctx) {
|
|
AttribExpr* self = (AttribExpr*)self_;
|
|
vtemit_(self->child, ctx);
|
|
Ctx__emit_(ctx, OP_LOAD_ATTR, self->name, self->line);
|
|
}
|
|
|
|
bool AttribExpr__emit_del(Expr* self_, Ctx* ctx) {
|
|
AttribExpr* self = (AttribExpr*)self_;
|
|
vtemit_(self->child, ctx);
|
|
Ctx__emit_(ctx, OP_DELETE_ATTR, self->name, self->line);
|
|
return true;
|
|
}
|
|
|
|
bool AttribExpr__emit_store(Expr* self_, Ctx* ctx) {
|
|
AttribExpr* self = (AttribExpr*)self_;
|
|
vtemit_(self->child, ctx);
|
|
Ctx__emit_(ctx, OP_STORE_ATTR, BC_NOARG, self->line);
|
|
return true;
|
|
}
|
|
|
|
void AttribExpr__emit_inplace(Expr* self_, Ctx* ctx) {
|
|
AttribExpr* self = (AttribExpr*)self_;
|
|
vtemit_(self->child, ctx);
|
|
Ctx__emit_(ctx, OP_DUP_TOP, BC_NOARG, self->line);
|
|
Ctx__emit_(ctx, OP_LOAD_ATTR, self->name, self->line);
|
|
}
|
|
|
|
bool AttribExpr__emit_istore(Expr* self_, Ctx* ctx) {
|
|
// [a, val] -> [val, a]
|
|
AttribExpr* self = (AttribExpr*)self_;
|
|
Ctx__emit_(ctx, OP_ROT_TWO, BC_NOARG, self->line);
|
|
Ctx__emit_(ctx, OP_STORE_ATTR, self->name, self->line);
|
|
return true;
|
|
}
|
|
|
|
AttribExpr* AttribExpr__new(int line, Expr* child, py_Name name) {
|
|
const static ExprVt Vt = {.emit_ = AttribExpr__emit_,
|
|
.emit_del = AttribExpr__emit_del,
|
|
.emit_store = AttribExpr__emit_store,
|
|
.emit_inplace = AttribExpr__emit_inplace,
|
|
.emit_istore = AttribExpr__emit_istore,
|
|
.dtor = AttribExpr__dtor,
|
|
.is_attrib = true};
|
|
static_assert_expr_size(AttribExpr);
|
|
AttribExpr* self = PoolExpr_alloc();
|
|
self->vt = &Vt;
|
|
self->line = line;
|
|
self->child = child;
|
|
self->name = name;
|
|
return self;
|
|
}
|
|
|
|
typedef struct CallExprKwArg {
|
|
py_Name key;
|
|
Expr* val;
|
|
} CallExprKwArg;
|
|
|
|
typedef struct CallExpr {
|
|
EXPR_COMMON_HEADER
|
|
Expr* callable;
|
|
c11_vector /*T=Expr* */ args;
|
|
// **a will be interpreted as a special keyword argument: {{0}: a}
|
|
c11_vector /*T=CallExprKwArg */ kwargs;
|
|
} CallExpr;
|
|
|
|
void CallExpr__dtor(Expr* self_) {
|
|
CallExpr* self = (CallExpr*)self_;
|
|
vtdelete(self->callable);
|
|
c11__foreach(Expr*, &self->args, e) vtdelete(*e);
|
|
c11__foreach(CallExprKwArg, &self->kwargs, e) vtdelete(e->val);
|
|
c11_vector__dtor(&self->args);
|
|
c11_vector__dtor(&self->kwargs);
|
|
}
|
|
|
|
void CallExpr__emit_(Expr* self_, Ctx* ctx) {
|
|
CallExpr* self = (CallExpr*)self_;
|
|
|
|
bool vargs = false; // whether there is *args as input
|
|
bool vkwargs = false; // whether there is **kwargs as input
|
|
c11__foreach(Expr*, &self->args, e) {
|
|
if((*e)->vt->is_starred) vargs = true;
|
|
}
|
|
c11__foreach(CallExprKwArg, &self->kwargs, e) {
|
|
if(e->val->vt->is_starred) vkwargs = true;
|
|
}
|
|
|
|
// if callable is a AttrExpr, we should try to use `fast_call` instead of use `boundmethod`
|
|
if(self->callable->vt->is_attrib) {
|
|
AttribExpr* p = (AttribExpr*)self->callable;
|
|
vtemit_(p->child, ctx);
|
|
Ctx__emit_(ctx, OP_LOAD_METHOD, p->name, p->line);
|
|
} else {
|
|
vtemit_(self->callable, ctx);
|
|
Ctx__emit_(ctx, OP_LOAD_NULL, BC_NOARG, BC_KEEPLINE);
|
|
}
|
|
|
|
Opcode opcode = OP_CALL;
|
|
if(vargs || vkwargs) {
|
|
// in this case, there is at least one *args or **kwargs as StarredExpr
|
|
// OP_CALL_VARGS needs to unpack them via __vectorcall_buffer
|
|
opcode = OP_CALL_VARGS;
|
|
}
|
|
|
|
c11__foreach(Expr*, &self->args, e) { vtemit_(*e, ctx); }
|
|
c11__foreach(CallExprKwArg, &self->kwargs, e) {
|
|
Ctx__emit_int(ctx, e->key, self->line);
|
|
vtemit_(e->val, ctx);
|
|
}
|
|
int KWARGC = self->kwargs.count;
|
|
int ARGC = self->args.count;
|
|
assert(KWARGC < 256 && ARGC < 256);
|
|
Ctx__emit_(ctx, opcode, (KWARGC << 8) | ARGC, self->line);
|
|
}
|
|
|
|
CallExpr* CallExpr__new(int line, Expr* callable) {
|
|
const static ExprVt Vt = {.dtor = CallExpr__dtor, .emit_ = CallExpr__emit_};
|
|
static_assert_expr_size(CallExpr);
|
|
CallExpr* self = PoolExpr_alloc();
|
|
self->vt = &Vt;
|
|
self->line = line;
|
|
self->callable = callable;
|
|
c11_vector__ctor(&self->args, sizeof(Expr*));
|
|
c11_vector__ctor(&self->kwargs, sizeof(CallExprKwArg));
|
|
return self;
|
|
}
|
|
|
|
/* context.c */
|
|
static void Ctx__ctor(Ctx* self, CodeObject* co, FuncDecl* func, int level) {
|
|
self->co = co;
|
|
self->func = func;
|
|
self->level = level;
|
|
self->curr_iblock = 0;
|
|
self->is_compiling_class = false;
|
|
c11_vector__ctor(&self->s_expr, sizeof(Expr*));
|
|
c11_smallmap_n2i__ctor(&self->global_names);
|
|
c11_smallmap_s2n__ctor(&self->co_consts_string_dedup_map);
|
|
}
|
|
|
|
static void Ctx__dtor(Ctx* self) {
|
|
// clean the expr stack
|
|
for(int i = 0; i < self->s_expr.count; i++) {
|
|
vtdelete(c11__getitem(Expr*, &self->s_expr, i));
|
|
}
|
|
c11_vector__dtor(&self->s_expr);
|
|
c11_smallmap_n2i__dtor(&self->global_names);
|
|
c11_smallmap_s2n__dtor(&self->co_consts_string_dedup_map);
|
|
}
|
|
|
|
static bool is_small_int(int64_t value) { return value >= INT16_MIN && value <= INT16_MAX; }
|
|
|
|
static int Ctx__get_loop(Ctx* self) {
|
|
int index = self->curr_iblock;
|
|
while(index >= 0) {
|
|
CodeBlock* block = c11__at(CodeBlock, &self->co->blocks, index);
|
|
if(block->type == CodeBlockType_FOR_LOOP) break;
|
|
if(block->type == CodeBlockType_WHILE_LOOP) break;
|
|
index = block->parent;
|
|
}
|
|
return index;
|
|
}
|
|
|
|
static CodeBlock* Ctx__enter_block(Ctx* self, CodeBlockType type) {
|
|
CodeBlock block = {type, self->curr_iblock, self->co->codes.count, -1, -1};
|
|
c11_vector__push(CodeBlock, &self->co->blocks, block);
|
|
self->curr_iblock = self->co->blocks.count - 1;
|
|
return c11__at(CodeBlock, &self->co->blocks, self->curr_iblock);
|
|
}
|
|
|
|
static void Ctx__exit_block(Ctx* self) {
|
|
CodeBlock* block = c11__at(CodeBlock, &self->co->blocks, self->curr_iblock);
|
|
CodeBlockType curr_type = block->type;
|
|
block->end = self->co->codes.count;
|
|
self->curr_iblock = block->parent;
|
|
assert(self->curr_iblock >= 0);
|
|
if(curr_type == CodeBlockType_FOR_LOOP) {
|
|
// add a no op here to make block check work
|
|
Ctx__emit_virtual(self, OP_NO_OP, BC_NOARG, BC_KEEPLINE, true);
|
|
}
|
|
}
|
|
|
|
static void Ctx__s_emit_decorators(Ctx* self, int count) {
|
|
assert(Ctx__s_size(self) >= count);
|
|
// [obj]
|
|
for(int i = 0; i < count; i++) {
|
|
Expr* deco = Ctx__s_popx(self);
|
|
vtemit_(deco, self); // [obj, f]
|
|
Ctx__emit_(self, OP_ROT_TWO, BC_NOARG, deco->line); // [f, obj]
|
|
Ctx__emit_(self, OP_LOAD_NULL, BC_NOARG, BC_KEEPLINE); // [f, obj, NULL]
|
|
Ctx__emit_(self, OP_ROT_TWO, BC_NOARG, BC_KEEPLINE); // [obj, NULL, f]
|
|
Ctx__emit_(self, OP_CALL, 1, deco->line); // [obj]
|
|
vtdelete(deco);
|
|
}
|
|
}
|
|
|
|
static int Ctx__emit_virtual(Ctx* self, Opcode opcode, uint16_t arg, int line, bool is_virtual) {
|
|
Bytecode bc = {(uint8_t)opcode, arg};
|
|
BytecodeEx bcx = {line, is_virtual, self->curr_iblock};
|
|
c11_vector__push(Bytecode, &self->co->codes, bc);
|
|
c11_vector__push(BytecodeEx, &self->co->codes_ex, bcx);
|
|
int i = self->co->codes.count - 1;
|
|
BytecodeEx* codes_ex = (BytecodeEx*)self->co->codes_ex.data;
|
|
if(line == BC_KEEPLINE) { codes_ex[i].lineno = i >= 1 ? codes_ex[i - 1].lineno : 1; }
|
|
return i;
|
|
}
|
|
|
|
static int Ctx__emit_(Ctx* self, Opcode opcode, uint16_t arg, int line) {
|
|
return Ctx__emit_virtual(self, opcode, arg, line, false);
|
|
}
|
|
|
|
static void Ctx__revert_last_emit_(Ctx* self) {
|
|
c11_vector__pop(&self->co->codes);
|
|
c11_vector__pop(&self->co->codes_ex);
|
|
}
|
|
|
|
static void Ctx__try_merge_for_iter_store(Ctx* self, int i) {
|
|
// [FOR_ITER, STORE_?, ]
|
|
Bytecode* co_codes = (Bytecode*)self->co->codes.data;
|
|
if(co_codes[i].op != OP_FOR_ITER) return;
|
|
if(self->co->codes.count - i != 2) return;
|
|
uint16_t arg = co_codes[i + 1].arg;
|
|
if(co_codes[i + 1].op == OP_STORE_FAST) {
|
|
Ctx__revert_last_emit_(self);
|
|
co_codes[i].op = OP_FOR_ITER_STORE_FAST;
|
|
co_codes[i].arg = arg;
|
|
return;
|
|
}
|
|
if(co_codes[i + 1].op == OP_STORE_GLOBAL) {
|
|
Ctx__revert_last_emit_(self);
|
|
co_codes[i].op = OP_FOR_ITER_STORE_GLOBAL;
|
|
co_codes[i].arg = arg;
|
|
return;
|
|
}
|
|
}
|
|
|
|
static int Ctx__emit_int(Ctx* self, int64_t value, int line) {
|
|
if(is_small_int(value)) {
|
|
return Ctx__emit_(self, OP_LOAD_SMALL_INT, (uint16_t)value, line);
|
|
} else {
|
|
py_TValue tmp;
|
|
py_newint(&tmp, value);
|
|
return Ctx__emit_(self, OP_LOAD_CONST, Ctx__add_const(self, &tmp), line);
|
|
}
|
|
}
|
|
|
|
static void Ctx__patch_jump(Ctx* self, int index) {
|
|
Bytecode* co_codes = (Bytecode*)self->co->codes.data;
|
|
int target = self->co->codes.count;
|
|
Bytecode__set_signed_arg(&co_codes[index], target - index);
|
|
}
|
|
|
|
static bool Ctx__add_label(Ctx* self, py_Name name) {
|
|
bool ok = c11_smallmap_n2i__contains(&self->co->labels, name);
|
|
if(ok) return false;
|
|
c11_smallmap_n2i__set(&self->co->labels, name, self->co->codes.count);
|
|
return true;
|
|
}
|
|
|
|
static int Ctx__add_varname(Ctx* self, py_Name name) {
|
|
// PK_MAX_CO_VARNAMES will be checked when pop_context(), not here
|
|
int index = c11_smallmap_n2i__get(&self->co->varnames_inv, name, -1);
|
|
if(index >= 0) return index;
|
|
c11_vector__push(uint16_t, &self->co->varnames, name);
|
|
self->co->nlocals++;
|
|
index = self->co->varnames.count - 1;
|
|
c11_smallmap_n2i__set(&self->co->varnames_inv, name, index);
|
|
return index;
|
|
}
|
|
|
|
static int Ctx__add_const_string(Ctx* self, c11_sv key) {
|
|
uint16_t* val = c11_smallmap_s2n__try_get(&self->co_consts_string_dedup_map, key);
|
|
if(val) {
|
|
return *val;
|
|
} else {
|
|
py_TValue tmp;
|
|
py_newstrn(&tmp, key.data, key.size);
|
|
c11_vector__push(py_TValue, &self->co->consts, tmp);
|
|
int index = self->co->consts.count - 1;
|
|
c11_smallmap_s2n__set(&self->co_consts_string_dedup_map,
|
|
c11_string__sv(PyObject__userdata(tmp._obj)),
|
|
index);
|
|
return index;
|
|
}
|
|
}
|
|
|
|
static int Ctx__add_const(Ctx* self, py_Ref v) {
|
|
assert(v->type != tp_str);
|
|
c11_vector__push(py_TValue, &self->co->consts, *v);
|
|
return self->co->consts.count - 1;
|
|
}
|
|
|
|
static void Ctx__emit_store_name(Ctx* self, NameScope scope, py_Name name, int line) {
|
|
switch(scope) {
|
|
case NAME_LOCAL: Ctx__emit_(self, OP_STORE_FAST, Ctx__add_varname(self, name), line); break;
|
|
case NAME_GLOBAL: Ctx__emit_(self, OP_STORE_GLOBAL, name, line); break;
|
|
case NAME_GLOBAL_UNKNOWN: Ctx__emit_(self, OP_STORE_NAME, name, line); break;
|
|
default: c11__unreachedable();
|
|
}
|
|
}
|
|
|
|
// emit top -> pop -> delete
|
|
static void Ctx__s_emit_top(Ctx* self) {
|
|
Expr* top = c11_vector__back(Expr*, &self->s_expr);
|
|
vtemit_(top, self);
|
|
vtdelete(top);
|
|
c11_vector__pop(&self->s_expr);
|
|
}
|
|
|
|
// push
|
|
static void Ctx__s_push(Ctx* self, Expr* expr) { c11_vector__push(Expr*, &self->s_expr, expr); }
|
|
|
|
// top
|
|
static Expr* Ctx__s_top(Ctx* self) { return c11_vector__back(Expr*, &self->s_expr); }
|
|
|
|
// size
|
|
static int Ctx__s_size(Ctx* self) { return self->s_expr.count; }
|
|
|
|
// pop -> delete
|
|
static void Ctx__s_pop(Ctx* self) {
|
|
Expr* top = c11_vector__back(Expr*, &self->s_expr);
|
|
vtdelete(top);
|
|
c11_vector__pop(&self->s_expr);
|
|
}
|
|
|
|
// pop move
|
|
static Expr* Ctx__s_popx(Ctx* self) {
|
|
Expr* top = c11_vector__back(Expr*, &self->s_expr);
|
|
c11_vector__pop(&self->s_expr);
|
|
return top;
|
|
}
|
|
|
|
/* compiler.c */
|
|
typedef struct Compiler Compiler;
|
|
typedef Error* (*PrattCallback)(Compiler* self);
|
|
|
|
typedef struct PrattRule {
|
|
PrattCallback prefix;
|
|
PrattCallback infix;
|
|
enum Precedence precedence;
|
|
} PrattRule;
|
|
|
|
const static PrattRule rules[TK__COUNT__];
|
|
|
|
typedef struct Compiler {
|
|
pk_SourceData_ src; // weakref
|
|
pk_TokenArray tokens;
|
|
int i;
|
|
c11_vector /*T=CodeEmitContext*/ contexts;
|
|
} Compiler;
|
|
|
|
static void Compiler__ctor(Compiler* self, pk_SourceData_ src, pk_TokenArray tokens) {
|
|
self->src = src;
|
|
self->tokens = tokens;
|
|
self->i = 0;
|
|
c11_vector__ctor(&self->contexts, sizeof(Ctx));
|
|
}
|
|
|
|
static void Compiler__dtor(Compiler* self) {
|
|
pk_TokenArray__dtor(&self->tokens);
|
|
c11_vector__dtor(&self->contexts);
|
|
}
|
|
|
|
/**************************************/
|
|
#define tk(i) c11__at(Token, &self->tokens, i)
|
|
#define prev() tk(self->i - 1)
|
|
#define curr() tk(self->i)
|
|
#define next() tk(self->i + 1)
|
|
// #define err() (self->i == self->tokens.count ? prev() : curr())
|
|
|
|
#define advance() self->i++
|
|
#define mode() self->src->mode
|
|
#define ctx() (&c11_vector__back(Ctx, &self->contexts))
|
|
|
|
#define match_newlines() match_newlines_repl(self, NULL)
|
|
|
|
#define consume(expected) \
|
|
if(!match(expected)) \
|
|
return SyntaxError("expected '%s', got '%s'", \
|
|
pk_TokenSymbols[expected], \
|
|
pk_TokenSymbols[curr()->type]);
|
|
#define consume_end_stmt() \
|
|
if(!match_end_stmt(self)) return SyntaxError("expected statement end")
|
|
#define check_newlines_repl() \
|
|
do { \
|
|
bool __nml; \
|
|
match_newlines_repl(self, &__nml); \
|
|
if(__nml) return NeedMoreLines(); \
|
|
} while(0)
|
|
#define check(B) \
|
|
if((err = B)) return err
|
|
|
|
static NameScope name_scope(Compiler* self) {
|
|
NameScope s = self->contexts.count > 1 ? NAME_LOCAL : NAME_GLOBAL;
|
|
if(self->src->is_dynamic && s == NAME_GLOBAL) s = NAME_GLOBAL_UNKNOWN;
|
|
return s;
|
|
}
|
|
|
|
#define SyntaxError(...) NULL
|
|
|
|
static Error* NeedMoreLines() { return NULL; }
|
|
|
|
/* Matchers */
|
|
static bool is_expression(Compiler* self, bool allow_slice) {
|
|
PrattCallback prefix = rules[curr()->type].prefix;
|
|
return prefix && (allow_slice || curr()->type != TK_COLON);
|
|
}
|
|
|
|
#define match(expected) (curr()->type == expected ? (++self->i) : 0)
|
|
|
|
static bool match_newlines_repl(Compiler* self, bool* need_more_lines) {
|
|
bool consumed = false;
|
|
if(curr()->type == TK_EOL) {
|
|
while(curr()->type == TK_EOL)
|
|
advance();
|
|
consumed = true;
|
|
}
|
|
if(need_more_lines) { *need_more_lines = (mode() == REPL_MODE && curr()->type == TK_EOF); }
|
|
return consumed;
|
|
}
|
|
|
|
static bool match_end_stmt(Compiler* self) {
|
|
if(match(TK_SEMICOLON)) {
|
|
match_newlines();
|
|
return true;
|
|
}
|
|
if(match_newlines() || curr()->type == TK_EOF) return true;
|
|
if(curr()->type == TK_DEDENT) return true;
|
|
return false;
|
|
}
|
|
|
|
/* Expression */
|
|
|
|
/// Parse an expression and push it onto the stack.
|
|
static Error* parse_expression(Compiler* self, int precedence, bool allow_slice) {
|
|
PrattCallback prefix = rules[curr()->type].prefix;
|
|
if(!prefix || (curr()->type == TK_COLON && !allow_slice)) {
|
|
return SyntaxError("expected an expression, got %s", pk_TokenSymbols[curr()->type]);
|
|
}
|
|
advance();
|
|
Error* err;
|
|
check(prefix(self));
|
|
while(rules[curr()->type].precedence >= precedence &&
|
|
(allow_slice || curr()->type != TK_COLON)) {
|
|
TokenIndex op = curr()->type;
|
|
advance();
|
|
PrattCallback infix = rules[op].infix;
|
|
assert(infix != NULL);
|
|
check(infix(self));
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
static Error* EXPR_TUPLE_ALLOW_SLICE(Compiler* self, bool allow_slice) {
|
|
Error* err;
|
|
check(parse_expression(self, PREC_LOWEST + 1, allow_slice));
|
|
if(!match(TK_COMMA)) return NULL;
|
|
// tuple expression // (a, )
|
|
int count = 1;
|
|
do {
|
|
if(curr()->brackets_level) check_newlines_repl();
|
|
if(!is_expression(self, allow_slice)) break;
|
|
check(parse_expression(self, PREC_LOWEST + 1, allow_slice));
|
|
count += 1;
|
|
if(curr()->brackets_level) check_newlines_repl();
|
|
} while(match(TK_COMMA));
|
|
// pop `count` expressions from the stack and merge them into a TupleExpr
|
|
SequenceExpr* e = TupleExpr__new(prev()->line, count);
|
|
for(int i = count - 1; i >= 0; i--) {
|
|
Expr* item = Ctx__s_popx(ctx());
|
|
c11__setitem(Expr*, &e->items, i, item);
|
|
}
|
|
Ctx__s_push(ctx(), (Expr*)e);
|
|
return NULL;
|
|
}
|
|
|
|
/// Parse a simple expression.
|
|
static Error* EXPR(Compiler* self) { return parse_expression(self, PREC_LOWEST + 1, false); }
|
|
|
|
/// Parse a simple expression or a tuple of expressions.
|
|
static Error* EXPR_TUPLE(Compiler* self) { return EXPR_TUPLE_ALLOW_SLICE(self, false); }
|
|
|
|
// special case for `for loop` and `comp`
|
|
static Error* EXPR_VARS(Compiler* self) {
|
|
// int count = 0;
|
|
// do {
|
|
// consume(TK_ID);
|
|
// ctx()->s_push(make_expr<NameExpr>(prev().str(), name_scope()));
|
|
// count += 1;
|
|
// } while(match(TK_COMMA));
|
|
// if(count > 1){
|
|
// TupleExpr* e = make_expr<TupleExpr>(count);
|
|
// for(int i=count-1; i>=0; i--)
|
|
// e->items[i] = Ctx__s_popx(ctx());
|
|
// ctx()->s_push(e);
|
|
// }
|
|
return NULL;
|
|
}
|
|
|
|
/* Misc */
|
|
static void push_global_context(Compiler* self, CodeObject* co) {
|
|
co->start_line = self->i == 0 ? 1 : prev()->line;
|
|
Ctx* ctx = c11_vector__emplace(&self->contexts);
|
|
Ctx__ctor(ctx, co, NULL, self->contexts.count);
|
|
}
|
|
|
|
static Error* pop_context(Compiler* self) {
|
|
// add a `return None` in the end as a guard
|
|
// previously, we only do this if the last opcode is not a return
|
|
// however, this is buggy...since there may be a jump to the end (out of bound) even if the last
|
|
// opcode is a return
|
|
Ctx__emit_virtual(ctx(), OP_RETURN_VALUE, 1, BC_KEEPLINE, true);
|
|
|
|
CodeObject* co = ctx()->co;
|
|
// find the last valid token
|
|
int j = self->i - 1;
|
|
while(tk(j)->type == TK_EOL || tk(j)->type == TK_DEDENT || tk(j)->type == TK_EOF)
|
|
j--;
|
|
co->end_line = tk(j)->line;
|
|
|
|
// some check here
|
|
c11_vector* codes = &co->codes;
|
|
if(co->nlocals > PK_MAX_CO_VARNAMES) {
|
|
return SyntaxError("maximum number of local variables exceeded");
|
|
}
|
|
if(co->consts.count > 65530) { return SyntaxError("maximum number of constants exceeded"); }
|
|
// pre-compute LOOP_BREAK and LOOP_CONTINUE
|
|
for(int i = 0; i < codes->count; i++) {
|
|
Bytecode* bc = c11__at(Bytecode, codes, i);
|
|
if(bc->op == OP_LOOP_CONTINUE) {
|
|
CodeBlock* block = c11__at(CodeBlock, &ctx()->co->blocks, bc->arg);
|
|
Bytecode__set_signed_arg(bc, block->start - i);
|
|
} else if(bc->op == OP_LOOP_BREAK) {
|
|
CodeBlock* block = c11__at(CodeBlock, &ctx()->co->blocks, bc->arg);
|
|
Bytecode__set_signed_arg(bc, (block->end2 != -1 ? block->end2 : block->end) - i);
|
|
}
|
|
}
|
|
// pre-compute func->is_simple
|
|
FuncDecl* func = ctx()->func;
|
|
if(func) {
|
|
// check generator
|
|
c11__foreach(Bytecode, &func->code.codes, bc) {
|
|
if(bc->op == OP_YIELD_VALUE || bc->op == OP_FOR_ITER_YIELD_VALUE) {
|
|
func->type = FuncType_GENERATOR;
|
|
c11__foreach(Bytecode, &func->code.codes, bc) {
|
|
if(bc->op == OP_RETURN_VALUE && bc->arg == BC_NOARG) {
|
|
return SyntaxError("'return' with argument inside generator function");
|
|
}
|
|
}
|
|
break;
|
|
}
|
|
}
|
|
if(func->type == FuncType_UNSET) {
|
|
bool is_simple = true;
|
|
if(func->kwargs.count > 0) is_simple = false;
|
|
if(func->starred_arg >= 0) is_simple = false;
|
|
if(func->starred_kwarg >= 0) is_simple = false;
|
|
|
|
if(is_simple) {
|
|
func->type = FuncType_SIMPLE;
|
|
|
|
bool is_empty = false;
|
|
if(func->code.codes.count == 1) {
|
|
Bytecode bc = c11__getitem(Bytecode, &func->code.codes, 0);
|
|
if(bc.op == OP_RETURN_VALUE && bc.arg == 1) { is_empty = true; }
|
|
}
|
|
if(is_empty) func->type = FuncType_EMPTY;
|
|
} else
|
|
func->type = FuncType_NORMAL;
|
|
}
|
|
|
|
assert(func->type != FuncType_UNSET);
|
|
}
|
|
Ctx__dtor(ctx());
|
|
c11_vector__pop(&self->contexts);
|
|
return NULL;
|
|
}
|
|
|
|
/* Expression Callbacks */
|
|
static Error* exprLiteral(Compiler* self) {
|
|
LiteralExpr* e = LiteralExpr__new(prev()->line, &prev()->value);
|
|
Ctx__s_push(ctx(), (Expr*)e);
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprLong(Compiler* self) {
|
|
c11_sv sv = Token__sv(prev());
|
|
Ctx__s_push(ctx(), (Expr*)RawStringExpr__new(prev()->line, sv, OP_BUILD_LONG));
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprBytes(Compiler* self) {
|
|
c11_sv sv = c11_string__sv(prev()->value._str);
|
|
Ctx__s_push(ctx(), (Expr*)RawStringExpr__new(prev()->line, sv, OP_BUILD_BYTES));
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprFString(Compiler* self) {
|
|
c11_sv sv = c11_string__sv(prev()->value._str);
|
|
Ctx__s_push(ctx(), (Expr*)FStringExpr__new(prev()->line, sv));
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprImag(Compiler* self) {
|
|
Ctx__s_push(ctx(), (Expr*)ImagExpr__new(prev()->line, prev()->value._f64));
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprLambda(Compiler* self) {
|
|
assert(false);
|
|
return NULL;
|
|
// Error* err;
|
|
// int line = prev()->line;
|
|
// int decl_index;
|
|
// FuncDecl_ decl = push_f_context({"<lambda>", 8}, &decl_index);
|
|
// if(!match(TK_COLON)) {
|
|
// check(_compile_f_args(decl, false));
|
|
// consume(TK_COLON);
|
|
// }
|
|
// // https://github.com/pocketpy/pocketpy/issues/37
|
|
// check(parse_expression(self, PREC_LAMBDA + 1, false));
|
|
// Ctx__s_emit_top(ctx());
|
|
// Ctx__emit_(ctx(), OP_RETURN_VALUE, BC_NOARG, BC_KEEPLINE);
|
|
// check(pop_context(self));
|
|
// LambdaExpr* e = LambdaExpr__new(line, decl_index);
|
|
// Ctx__s_push(ctx(), (Expr*)e);
|
|
// return NULL;
|
|
}
|
|
|
|
static Error* exprOr(Compiler* self) {
|
|
Error* err;
|
|
int line = prev()->line;
|
|
check(parse_expression(self, PREC_LOGICAL_OR + 1, false));
|
|
LogicBinaryExpr* e = LogicBinaryExpr__new(line, OP_JUMP_IF_TRUE_OR_POP);
|
|
e->rhs = Ctx__s_popx(ctx());
|
|
e->lhs = Ctx__s_popx(ctx());
|
|
Ctx__s_push(ctx(), (Expr*)e);
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprAnd(Compiler* self) {
|
|
Error* err;
|
|
int line = prev()->line;
|
|
check(parse_expression(self, PREC_LOGICAL_AND + 1, false));
|
|
LogicBinaryExpr* e = LogicBinaryExpr__new(line, OP_JUMP_IF_FALSE_OR_POP);
|
|
e->rhs = Ctx__s_popx(ctx());
|
|
e->lhs = Ctx__s_popx(ctx());
|
|
Ctx__s_push(ctx(), (Expr*)e);
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprTernary(Compiler* self) {
|
|
// [true_expr]
|
|
Error* err;
|
|
int line = prev()->line;
|
|
check(parse_expression(self, PREC_TERNARY + 1, false)); // [true_expr, cond]
|
|
consume(TK_ELSE);
|
|
check(parse_expression(self, PREC_TERNARY + 1, false)); // [true_expr, cond, false_expr]
|
|
TernaryExpr* e = TernaryExpr__new(line);
|
|
e->false_expr = Ctx__s_popx(ctx());
|
|
e->cond = Ctx__s_popx(ctx());
|
|
e->true_expr = Ctx__s_popx(ctx());
|
|
Ctx__s_push(ctx(), (Expr*)e);
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprBinaryOp(Compiler* self) {
|
|
Error* err;
|
|
int line = prev()->line;
|
|
TokenIndex op = prev()->type;
|
|
check(parse_expression(self, rules[op].precedence + 1, false));
|
|
BinaryExpr* e = BinaryExpr__new(line, op, false);
|
|
if(op == TK_IN || op == TK_NOT_IN) {
|
|
e->lhs = Ctx__s_popx(ctx());
|
|
e->rhs = Ctx__s_popx(ctx());
|
|
} else {
|
|
e->rhs = Ctx__s_popx(ctx());
|
|
e->lhs = Ctx__s_popx(ctx());
|
|
}
|
|
Ctx__s_push(ctx(), (Expr*)e);
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprNot(Compiler* self) {
|
|
Error* err;
|
|
int line = prev()->line;
|
|
check(parse_expression(self, PREC_LOGICAL_NOT + 1, false));
|
|
UnaryExpr* e = UnaryExpr__new(line, Ctx__s_popx(ctx()), OP_UNARY_NOT);
|
|
Ctx__s_push(ctx(), (Expr*)e);
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprUnaryOp(Compiler* self) {
|
|
Error* err;
|
|
int line = prev()->line;
|
|
TokenIndex op = prev()->type;
|
|
check(parse_expression(self, PREC_UNARY + 1, false));
|
|
Expr* e = Ctx__s_popx(ctx());
|
|
switch(op) {
|
|
case TK_SUB: Ctx__s_push(ctx(), (Expr*)UnaryExpr__new(line, e, OP_UNARY_NEGATIVE)); break;
|
|
case TK_INVERT: Ctx__s_push(ctx(), (Expr*)UnaryExpr__new(line, e, OP_UNARY_INVERT)); break;
|
|
case TK_MUL: Ctx__s_push(ctx(), (Expr*)StarredExpr__new(line, e, 1)); break;
|
|
case TK_POW: Ctx__s_push(ctx(), (Expr*)StarredExpr__new(line, e, 2)); break;
|
|
default: assert(false);
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprGroup(Compiler* self) {
|
|
Error* err;
|
|
int line = prev()->line;
|
|
check_newlines_repl();
|
|
check(EXPR_TUPLE(self)); // () is just for change precedence
|
|
check_newlines_repl();
|
|
consume(TK_RPAREN);
|
|
if(Ctx__s_top(ctx())->vt->is_tuple) return NULL;
|
|
GroupedExpr* g = GroupedExpr__new(line, Ctx__s_popx(ctx()));
|
|
Ctx__s_push(ctx(), (Expr*)g);
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprName(Compiler* self) {
|
|
py_Name name = py_name2(Token__sv(prev()));
|
|
NameScope scope = name_scope(self);
|
|
// promote this name to global scope if needed
|
|
if(c11_smallmap_n2i__contains(&ctx()->global_names, name)) { scope = NAME_GLOBAL; }
|
|
NameExpr* e = NameExpr__new(prev()->line, name, scope);
|
|
Ctx__s_push(ctx(), (Expr*)e);
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprAttrib(Compiler* self) {
|
|
consume(TK_ID);
|
|
py_Name name = py_name2(Token__sv(prev()));
|
|
AttribExpr* e = AttribExpr__new(prev()->line, Ctx__s_popx(ctx()), name);
|
|
Ctx__s_push(ctx(), (Expr*)e);
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprLiteral0(Compiler* self) {
|
|
Literal0Expr* e = Literal0Expr__new(prev()->line, prev()->type);
|
|
Ctx__s_push(ctx(), (Expr*)e);
|
|
return NULL;
|
|
}
|
|
|
|
static Error* consume_comp(Compiler* self, Opcode op0, Opcode op1) {
|
|
// [expr]
|
|
Error* err;
|
|
int line = prev()->line;
|
|
bool has_cond = false;
|
|
check(EXPR_VARS(self)); // [expr, vars]
|
|
consume(TK_IN);
|
|
check(parse_expression(self, PREC_TERNARY + 1, false)); // [expr, vars, iter]
|
|
check_newlines_repl();
|
|
if(match(TK_IF)) {
|
|
check(parse_expression(self, PREC_TERNARY + 1, false)); // [expr, vars, iter, cond]
|
|
has_cond = true;
|
|
}
|
|
CompExpr* ce = CompExpr__new(line, op0, op1);
|
|
if(has_cond) ce->cond = Ctx__s_popx(ctx());
|
|
ce->iter = Ctx__s_popx(ctx());
|
|
ce->vars = Ctx__s_popx(ctx());
|
|
ce->expr = Ctx__s_popx(ctx());
|
|
Ctx__s_push(ctx(), (Expr*)ce);
|
|
check_newlines_repl();
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprList(Compiler* self) {
|
|
Error* err;
|
|
int line = prev()->line;
|
|
int count = 0;
|
|
do {
|
|
check_newlines_repl();
|
|
if(curr()->type == TK_RBRACKET) break;
|
|
check(EXPR(self));
|
|
count += 1;
|
|
check_newlines_repl();
|
|
if(count == 1 && match(TK_FOR)) {
|
|
check(consume_comp(self, OP_BUILD_LIST, OP_LIST_APPEND));
|
|
consume(TK_RBRACKET);
|
|
return NULL;
|
|
}
|
|
check_newlines_repl();
|
|
} while(match(TK_COMMA));
|
|
consume(TK_RBRACKET);
|
|
SequenceExpr* e = ListExpr__new(line, count);
|
|
for(int i = count - 1; i >= 0; i--) {
|
|
c11__setitem(Expr*, &e->items, i, Ctx__s_popx(ctx()));
|
|
}
|
|
Ctx__s_push(ctx(), (Expr*)e);
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprMap(Compiler* self) {
|
|
Error* err;
|
|
int line = prev()->line;
|
|
bool parsing_dict = false; // {...} may be dict or set
|
|
int count = 0;
|
|
do {
|
|
check_newlines_repl();
|
|
if(curr()->type == TK_RBRACE) break;
|
|
check(EXPR(self)); // [key]
|
|
if(curr()->type == TK_COLON) { parsing_dict = true; }
|
|
if(parsing_dict) {
|
|
consume(TK_COLON);
|
|
check(EXPR(self)); // [key, value]
|
|
}
|
|
count += 1; // key-value pair count
|
|
check_newlines_repl();
|
|
if(count == 1 && match(TK_FOR)) {
|
|
if(parsing_dict) {
|
|
check(consume_comp(self, OP_BUILD_DICT, OP_DICT_ADD));
|
|
} else {
|
|
check(consume_comp(self, OP_BUILD_SET, OP_SET_ADD));
|
|
}
|
|
consume(TK_RBRACE);
|
|
return NULL;
|
|
}
|
|
check_newlines_repl();
|
|
} while(match(TK_COMMA));
|
|
consume(TK_RBRACE);
|
|
|
|
SequenceExpr* se;
|
|
if(count == 0 || parsing_dict) {
|
|
count *= 2; // key + value
|
|
se = DictExpr__new(line, count);
|
|
} else {
|
|
se = SetExpr__new(line, count);
|
|
}
|
|
for(int i = count - 1; i >= 0; i--) {
|
|
c11__setitem(Expr*, &se->items, i, Ctx__s_popx(ctx()));
|
|
}
|
|
Ctx__s_push(ctx(), (Expr*)se);
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprCall(Compiler* self) {
|
|
Error* err;
|
|
CallExpr* e = CallExpr__new(prev()->line, Ctx__s_popx(ctx()));
|
|
Ctx__s_push(ctx(), (Expr*)e); // push onto the stack in advance
|
|
do {
|
|
check_newlines_repl();
|
|
if(curr()->type == TK_RPAREN) break;
|
|
if(curr()->type == TK_ID && next()->type == TK_ASSIGN) {
|
|
consume(TK_ID);
|
|
py_Name key = py_name2(Token__sv(prev()));
|
|
consume(TK_ASSIGN);
|
|
check(EXPR(self));
|
|
CallExprKwArg kw = {key, Ctx__s_popx(ctx())};
|
|
c11_vector__push(CallExprKwArg, &e->kwargs, kw);
|
|
} else {
|
|
check(EXPR(self));
|
|
int star_level = 0;
|
|
Expr* top = Ctx__s_top(ctx());
|
|
if(top->vt->is_starred) star_level = ((StarredExpr*)top)->level;
|
|
if(star_level == 2) {
|
|
// **kwargs
|
|
CallExprKwArg kw = {0, Ctx__s_popx(ctx())};
|
|
c11_vector__push(CallExprKwArg, &e->kwargs, kw);
|
|
} else {
|
|
// positional argument
|
|
if(e->kwargs.count > 0) {
|
|
return SyntaxError("positional argument follows keyword argument");
|
|
}
|
|
c11_vector__push(Expr*, &e->args, Ctx__s_popx(ctx()));
|
|
}
|
|
}
|
|
check_newlines_repl();
|
|
} while(match(TK_COMMA));
|
|
consume(TK_RPAREN);
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprSlice0(Compiler* self) {
|
|
Error* err;
|
|
SliceExpr* slice = SliceExpr__new(prev()->line);
|
|
Ctx__s_push(ctx(), (Expr*)slice); // push onto the stack in advance
|
|
if(is_expression(self, false)) { // :<stop>
|
|
check(EXPR(self));
|
|
slice->stop = Ctx__s_popx(ctx());
|
|
// try optional step
|
|
if(match(TK_COLON)) { // :<stop>:<step>
|
|
check(EXPR(self));
|
|
slice->step = Ctx__s_popx(ctx());
|
|
}
|
|
} else if(match(TK_COLON)) {
|
|
if(is_expression(self, false)) { // ::<step>
|
|
check(EXPR(self));
|
|
slice->step = Ctx__s_popx(ctx());
|
|
} // else ::
|
|
} // else :
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprSlice1(Compiler* self) {
|
|
Error* err;
|
|
SliceExpr* slice = SliceExpr__new(prev()->line);
|
|
slice->start = Ctx__s_popx(ctx());
|
|
Ctx__s_push(ctx(), (Expr*)slice); // push onto the stack in advance
|
|
if(is_expression(self, false)) { // <start>:<stop>
|
|
check(EXPR(self));
|
|
slice->stop = Ctx__s_popx(ctx());
|
|
// try optional step
|
|
if(match(TK_COLON)) { // <start>:<stop>:<step>
|
|
check(EXPR(self));
|
|
slice->step = Ctx__s_popx(ctx());
|
|
}
|
|
} else if(match(TK_COLON)) { // <start>::<step>
|
|
check(EXPR(self));
|
|
slice->step = Ctx__s_popx(ctx());
|
|
} // else <start>:
|
|
return NULL;
|
|
}
|
|
|
|
static Error* exprSubscr(Compiler* self) {
|
|
Error* err;
|
|
int line = prev()->line;
|
|
check_newlines_repl();
|
|
check(EXPR_TUPLE_ALLOW_SLICE(self, true));
|
|
check_newlines_repl();
|
|
consume(TK_RBRACKET); // [lhs, rhs]
|
|
SubscrExpr* e = SubscrExpr__new(line);
|
|
e->rhs = Ctx__s_popx(ctx()); // [lhs]
|
|
e->lhs = Ctx__s_popx(ctx()); // []
|
|
Ctx__s_push(ctx(), (Expr*)e);
|
|
return NULL;
|
|
}
|
|
|
|
////////////////
|
|
static Error* consume_type_hints(Compiler* self) {
|
|
Error* err;
|
|
check(EXPR(self));
|
|
Ctx__s_pop(ctx());
|
|
return NULL;
|
|
}
|
|
|
|
Error* try_compile_assignment(Compiler* self, bool* is_assign) {
|
|
Error* err;
|
|
switch(curr()->type) {
|
|
case TK_IADD:
|
|
case TK_ISUB:
|
|
case TK_IMUL:
|
|
case TK_IDIV:
|
|
case TK_IFLOORDIV:
|
|
case TK_IMOD:
|
|
case TK_ILSHIFT:
|
|
case TK_IRSHIFT:
|
|
case TK_IAND:
|
|
case TK_IOR:
|
|
case TK_IXOR: {
|
|
if(Ctx__s_top(ctx())->vt->is_starred) return SyntaxError();
|
|
if(ctx()->is_compiling_class) {
|
|
return SyntaxError("can't use inplace operator in class definition");
|
|
}
|
|
advance();
|
|
// a[x] += 1; a and x should be evaluated only once
|
|
// a.x += 1; a should be evaluated only once
|
|
// -1 to remove =; inplace=true
|
|
int line = prev()->line;
|
|
TokenIndex op = (TokenIndex)(prev()->type - 1);
|
|
// [lhs]
|
|
check(EXPR_TUPLE(self)); // [lhs, rhs]
|
|
if(Ctx__s_top(ctx())->vt->is_starred) return SyntaxError();
|
|
BinaryExpr* e = BinaryExpr__new(line, op, true);
|
|
e->rhs = Ctx__s_popx(ctx()); // [lhs]
|
|
e->lhs = Ctx__s_popx(ctx()); // []
|
|
vtemit_((Expr*)e, ctx());
|
|
bool ok = vtemit_istore(e->lhs, ctx());
|
|
vtdelete((Expr*)e);
|
|
if(!ok) return SyntaxError();
|
|
*is_assign = true;
|
|
return NULL;
|
|
}
|
|
case TK_ASSIGN: {
|
|
int n = 0;
|
|
while(match(TK_ASSIGN)) {
|
|
check(EXPR_TUPLE(self));
|
|
n += 1;
|
|
}
|
|
// stack size is n+1
|
|
Ctx__s_emit_top(ctx());
|
|
for(int j = 1; j < n; j++)
|
|
Ctx__emit_(ctx(), OP_DUP_TOP, BC_NOARG, BC_KEEPLINE);
|
|
for(int j = 0; j < n; j++) {
|
|
if(Ctx__s_top(ctx())->vt->is_starred) return SyntaxError();
|
|
Expr* e = Ctx__s_top(ctx());
|
|
bool ok = vtemit_store(e, ctx());
|
|
Ctx__s_pop(ctx());
|
|
if(!ok) return SyntaxError();
|
|
}
|
|
*is_assign = true;
|
|
return NULL;
|
|
}
|
|
default: *is_assign = false;
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
static Error* compile_stmt(Compiler* self) {
|
|
Error* err;
|
|
if(match(TK_CLASS)) {
|
|
// check(compile_class());
|
|
assert(false);
|
|
return NULL;
|
|
}
|
|
advance();
|
|
int kw_line = prev()->line; // backup line number
|
|
int curr_loop_block = Ctx__get_loop(ctx());
|
|
switch(prev()->type) {
|
|
case TK_BREAK:
|
|
if(curr_loop_block < 0) return SyntaxError("'break' outside loop");
|
|
Ctx__emit_(ctx(), OP_LOOP_BREAK, curr_loop_block, kw_line);
|
|
consume_end_stmt();
|
|
break;
|
|
case TK_CONTINUE:
|
|
if(curr_loop_block < 0) return SyntaxError("'continue' not properly in loop");
|
|
Ctx__emit_(ctx(), OP_LOOP_CONTINUE, curr_loop_block, kw_line);
|
|
consume_end_stmt();
|
|
break;
|
|
case TK_YIELD:
|
|
if(self->contexts.count <= 1) return SyntaxError("'yield' outside function");
|
|
check(EXPR_TUPLE(self));
|
|
Ctx__s_emit_top(ctx());
|
|
Ctx__emit_(ctx(), OP_YIELD_VALUE, BC_NOARG, kw_line);
|
|
consume_end_stmt();
|
|
break;
|
|
case TK_YIELD_FROM:
|
|
if(self->contexts.count <= 1) return SyntaxError("'yield from' outside function");
|
|
check(EXPR_TUPLE(self));
|
|
Ctx__s_emit_top(ctx());
|
|
Ctx__emit_(ctx(), OP_GET_ITER_NEW, BC_NOARG, kw_line);
|
|
Ctx__enter_block(ctx(), CodeBlockType_FOR_LOOP);
|
|
Ctx__emit_(ctx(), OP_FOR_ITER_YIELD_VALUE, BC_NOARG, kw_line);
|
|
Ctx__emit_(ctx(), OP_LOOP_CONTINUE, Ctx__get_loop(ctx()), kw_line);
|
|
Ctx__exit_block(ctx());
|
|
consume_end_stmt();
|
|
break;
|
|
case TK_RETURN:
|
|
if(self->contexts.count <= 1) return SyntaxError("'return' outside function");
|
|
if(match_end_stmt(self)) {
|
|
Ctx__emit_(ctx(), OP_RETURN_VALUE, 1, kw_line);
|
|
} else {
|
|
check(EXPR_TUPLE(self));
|
|
Ctx__s_emit_top(ctx());
|
|
consume_end_stmt();
|
|
Ctx__emit_(ctx(), OP_RETURN_VALUE, BC_NOARG, kw_line);
|
|
}
|
|
break;
|
|
/*************************************************/
|
|
// case TK_IF: check(compile_if_stmt()); break;
|
|
// case TK_WHILE: check(compile_while_loop()); break;
|
|
// case TK_FOR: check(compile_for_loop()); break;
|
|
// case TK_IMPORT: check(compile_normal_import()); break;
|
|
// case TK_FROM: check(compile_from_import()); break;
|
|
// case TK_DEF: check(compile_function()); break;
|
|
// case TK_DECORATOR: check(compile_decorated()); break;
|
|
// case TK_TRY: check(compile_try_except()); break;
|
|
case TK_PASS: consume_end_stmt(); break;
|
|
/*************************************************/
|
|
case TK_ASSERT: {
|
|
check(EXPR(self)); // condition
|
|
Ctx__s_emit_top(ctx());
|
|
int index = Ctx__emit_(ctx(), OP_POP_JUMP_IF_TRUE, BC_NOARG, kw_line);
|
|
int has_msg = 0;
|
|
if(match(TK_COMMA)) {
|
|
check(EXPR(self)); // message
|
|
Ctx__s_emit_top(ctx());
|
|
has_msg = 1;
|
|
}
|
|
Ctx__emit_(ctx(), OP_RAISE_ASSERT, has_msg, kw_line);
|
|
Ctx__patch_jump(ctx(), index);
|
|
consume_end_stmt();
|
|
break;
|
|
}
|
|
case TK_GLOBAL:
|
|
do {
|
|
consume(TK_ID);
|
|
py_Name name = py_name2(Token__sv(prev()));
|
|
c11_smallmap_n2i__set(&ctx()->global_names, name, 0);
|
|
} while(match(TK_COMMA));
|
|
consume_end_stmt();
|
|
break;
|
|
case TK_RAISE: {
|
|
check(EXPR(self));
|
|
Ctx__s_emit_top(ctx());
|
|
Ctx__emit_(ctx(), OP_RAISE, BC_NOARG, kw_line);
|
|
consume_end_stmt();
|
|
} break;
|
|
case TK_DEL: {
|
|
check(EXPR_TUPLE(self));
|
|
Expr* e = Ctx__s_top(ctx());
|
|
if(!vtemit_del(e, ctx())) return SyntaxError();
|
|
Ctx__s_pop(ctx());
|
|
consume_end_stmt();
|
|
} break;
|
|
// case TK_WITH: {
|
|
// check(EXPR(self)); // [ <expr> ]
|
|
// Ctx__s_emit_top(ctx());
|
|
// Ctx__enter_block(ctx(), CodeBlockType_CONTEXT_MANAGER);
|
|
// Expr* as_name = nullptr;
|
|
// if(match(TK_AS)) {
|
|
// consume(TK_ID);
|
|
// as_name = make_expr<NameExpr>(prev().str(), name_scope());
|
|
// }
|
|
// Ctx__emit_(ctx(), OP_WITH_ENTER, BC_NOARG, prev().line);
|
|
// // [ <expr> <expr>.__enter__() ]
|
|
// if(as_name) {
|
|
// bool ok = as_name->emit_store(ctx());
|
|
// delete_expr(as_name);
|
|
// if(!ok) return SyntaxError();
|
|
// } else {
|
|
// Ctx__emit_(ctx(), OP_POP_TOP, BC_NOARG, BC_KEEPLINE);
|
|
// }
|
|
// check(compile_block_body());
|
|
// Ctx__emit_(ctx(), OP_WITH_EXIT, BC_NOARG, prev().line);
|
|
// Ctx__exit_block(ctx());
|
|
// } break;
|
|
/*************************************************/
|
|
case TK_EQ: {
|
|
consume(TK_ID);
|
|
if(mode() != EXEC_MODE) return SyntaxError("'label' is only available in EXEC_MODE");
|
|
c11_sv name = Token__sv(prev());
|
|
bool ok = Ctx__add_label(ctx(), py_name2(name));
|
|
if(!ok) return SyntaxError("label %q already exists", name);
|
|
consume(TK_EQ);
|
|
consume_end_stmt();
|
|
} break;
|
|
case TK_ARROW:
|
|
consume(TK_ID);
|
|
if(mode() != EXEC_MODE) return SyntaxError("'goto' is only available in EXEC_MODE");
|
|
py_Name name = py_name2(Token__sv(prev()));
|
|
Ctx__emit_(ctx(), OP_GOTO, name, prev()->line);
|
|
consume_end_stmt();
|
|
break;
|
|
/*************************************************/
|
|
// handle dangling expression or assignment
|
|
default: {
|
|
// do revert since we have pre-called advance() at the beginning
|
|
--self->i;
|
|
|
|
check(EXPR_TUPLE(self));
|
|
|
|
bool is_typed_name = false; // e.g. x: int
|
|
// eat variable's type hint if it is a single name
|
|
if(Ctx__s_top(ctx())->vt->is_name) {
|
|
if(match(TK_COLON)) {
|
|
check(consume_type_hints(self));
|
|
is_typed_name = true;
|
|
|
|
if(ctx()->is_compiling_class) {
|
|
NameExpr* ne = (NameExpr*)Ctx__s_top(ctx());
|
|
Ctx__emit_(ctx(), OP_ADD_CLASS_ANNOTATION, ne->name, BC_KEEPLINE);
|
|
}
|
|
}
|
|
}
|
|
bool is_assign = false;
|
|
check(try_compile_assignment(self, &is_assign));
|
|
if(!is_assign) {
|
|
if(Ctx__s_size(ctx()) > 0 && Ctx__s_top(ctx())->vt->is_starred) {
|
|
return SyntaxError();
|
|
}
|
|
if(!is_typed_name) {
|
|
Ctx__s_emit_top(ctx());
|
|
if((mode() == CELL_MODE || mode() == REPL_MODE) &&
|
|
name_scope(self) == NAME_GLOBAL) {
|
|
Ctx__emit_(ctx(), OP_PRINT_EXPR, BC_NOARG, BC_KEEPLINE);
|
|
} else {
|
|
Ctx__emit_(ctx(), OP_POP_TOP, BC_NOARG, BC_KEEPLINE);
|
|
}
|
|
} else {
|
|
Ctx__s_pop(ctx());
|
|
}
|
|
}
|
|
consume_end_stmt();
|
|
break;
|
|
}
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
/////////////////////////////////////////////////////////////////
|
|
|
|
Error* Compiler__compile(Compiler* self, CodeObject* out) {
|
|
// make sure it is the first time to compile
|
|
assert(self->i == 0);
|
|
// make sure the first token is @sof
|
|
assert(tk(0)->type == TK_SOF);
|
|
|
|
push_global_context(self, out);
|
|
|
|
advance(); // skip @sof, so prev() is always valid
|
|
match_newlines(); // skip possible leading '\n'
|
|
|
|
Error* err;
|
|
if(mode() == EVAL_MODE) {
|
|
check(EXPR_TUPLE(self));
|
|
Ctx__s_emit_top(ctx());
|
|
consume(TK_EOF);
|
|
Ctx__emit_(ctx(), OP_RETURN_VALUE, BC_NOARG, BC_KEEPLINE);
|
|
check(pop_context(self));
|
|
return NULL;
|
|
} else if(mode() == JSON_MODE) {
|
|
check(EXPR(self));
|
|
Expr* e = Ctx__s_popx(ctx());
|
|
if(!e->vt->is_json_object) { return SyntaxError("expect a JSON object, literal or array"); }
|
|
consume(TK_EOF);
|
|
vtemit_(e, ctx());
|
|
Ctx__emit_(ctx(), OP_RETURN_VALUE, BC_NOARG, BC_KEEPLINE);
|
|
check(pop_context(self));
|
|
return NULL;
|
|
}
|
|
|
|
while(!match(TK_EOF)) {
|
|
check(compile_stmt(self));
|
|
match_newlines();
|
|
}
|
|
check(pop_context(self));
|
|
return NULL;
|
|
}
|
|
|
|
Error* pk_compile(pk_SourceData_ src, CodeObject* out) {
|
|
pk_TokenArray tokens;
|
|
Error* err = pk_Lexer__process(src, &tokens);
|
|
if(err) return err;
|
|
|
|
Token* data = (Token*)tokens.data;
|
|
printf("%s\n", src->filename->data);
|
|
for(int i = 0; i < tokens.count; i++) {
|
|
Token* t = data + i;
|
|
c11_string* tmp = c11_string__new2(t->start, t->length);
|
|
printf("[%d] %s: %s\n", t->line, pk_TokenSymbols[t->type], tmp->data);
|
|
c11_string__delete(tmp);
|
|
}
|
|
|
|
Compiler compiler;
|
|
Compiler__ctor(&compiler, src, tokens);
|
|
CodeObject__ctor(out, src, c11_string__sv(src->filename));
|
|
err = Compiler__compile(&compiler, out);
|
|
if(err) {
|
|
// dispose the code object if error occurs
|
|
CodeObject__dtor(out);
|
|
}
|
|
Compiler__dtor(&compiler);
|
|
return err;
|
|
}
|
|
|
|
// clang-format off
|
|
const static PrattRule rules[TK__COUNT__] = {
|
|
// http://journal.stuffwithstuff.com/2011/03/19/pratt-parsers-expression-parsing-made-easy/
|
|
[TK_DOT] = { NULL, exprAttrib, PREC_PRIMARY },
|
|
[TK_LPAREN] = { exprGroup, exprCall, PREC_PRIMARY },
|
|
[TK_LBRACKET] = { exprList, exprSubscr, PREC_PRIMARY },
|
|
[TK_MOD] = { NULL, exprBinaryOp, PREC_FACTOR },
|
|
[TK_ADD] = { NULL, exprBinaryOp, PREC_TERM },
|
|
[TK_SUB] = { exprUnaryOp, exprBinaryOp, PREC_TERM },
|
|
[TK_MUL] = { exprUnaryOp, exprBinaryOp, PREC_FACTOR },
|
|
[TK_INVERT] = { exprUnaryOp, NULL, PREC_UNARY },
|
|
[TK_DIV] = { NULL, exprBinaryOp, PREC_FACTOR },
|
|
[TK_FLOORDIV] = { NULL, exprBinaryOp, PREC_FACTOR },
|
|
[TK_POW] = { exprUnaryOp, exprBinaryOp, PREC_EXPONENT },
|
|
[TK_GT] = { NULL, exprBinaryOp, PREC_COMPARISION },
|
|
[TK_LT] = { NULL, exprBinaryOp, PREC_COMPARISION },
|
|
[TK_EQ] = { NULL, exprBinaryOp, PREC_COMPARISION },
|
|
[TK_NE] = { NULL, exprBinaryOp, PREC_COMPARISION },
|
|
[TK_GE] = { NULL, exprBinaryOp, PREC_COMPARISION },
|
|
[TK_LE] = { NULL, exprBinaryOp, PREC_COMPARISION },
|
|
[TK_IN] = { NULL, exprBinaryOp, PREC_COMPARISION },
|
|
[TK_IS] = { NULL, exprBinaryOp, PREC_COMPARISION },
|
|
[TK_LSHIFT] = { NULL, exprBinaryOp, PREC_BITWISE_SHIFT },
|
|
[TK_RSHIFT] = { NULL, exprBinaryOp, PREC_BITWISE_SHIFT },
|
|
[TK_AND] = { NULL, exprBinaryOp, PREC_BITWISE_AND },
|
|
[TK_OR] = { NULL, exprBinaryOp, PREC_BITWISE_OR },
|
|
[TK_XOR] = { NULL, exprBinaryOp, PREC_BITWISE_XOR },
|
|
[TK_DECORATOR] = { NULL, exprBinaryOp, PREC_FACTOR },
|
|
[TK_IF] = { NULL, exprTernary, PREC_TERNARY },
|
|
[TK_NOT_IN] = { NULL, exprBinaryOp, PREC_COMPARISION },
|
|
[TK_IS_NOT] = { NULL, exprBinaryOp, PREC_COMPARISION },
|
|
[TK_AND_KW ] = { NULL, exprAnd, PREC_LOGICAL_AND },
|
|
[TK_OR_KW] = { NULL, exprOr, PREC_LOGICAL_OR },
|
|
[TK_NOT_KW] = { exprNot, NULL, PREC_LOGICAL_NOT },
|
|
[TK_TRUE] = { exprLiteral0 },
|
|
[TK_FALSE] = { exprLiteral0 },
|
|
[TK_NONE] = { exprLiteral0 },
|
|
[TK_DOTDOTDOT] = { exprLiteral0 },
|
|
[TK_LAMBDA] = { exprLambda, },
|
|
[TK_ID] = { exprName, },
|
|
[TK_NUM] = { exprLiteral, },
|
|
[TK_STR] = { exprLiteral, },
|
|
[TK_FSTR] = { exprFString, },
|
|
[TK_LONG] = { exprLong, },
|
|
[TK_IMAG] = { exprImag, },
|
|
[TK_BYTES] = { exprBytes, },
|
|
[TK_LBRACE] = { exprMap },
|
|
[TK_COLON] = { exprSlice0, exprSlice1, PREC_PRIMARY }
|
|
};
|
|
// clang-format on
|