From 3a10784fbd754b2010433c9137c7bf2a66dd3d7c Mon Sep 17 00:00:00 2001
From: BLUELOVETH
Date: Sun, 30 Apr 2023 16:54:29 +0000
Subject: [PATCH] ...

---
 amalgamate.py      |   2 +-
 src/base64.h       | 210 +++++++++++++++++++++++++++++++++++++++++++++
 src/pocketpy.h     |   2 +
 tests/70_base64.py |  13 +++
 4 files changed, 226 insertions(+), 1 deletion(-)
 create mode 100644 src/base64.h
 create mode 100644 tests/70_base64.py

diff --git a/amalgamate.py b/amalgamate.py
index e3614989..7e16900a 100644
--- a/amalgamate.py
+++ b/amalgamate.py
@@ -9,7 +9,7 @@ pipeline = [
 	["common.h", "memory.h", "vector.h", "str.h", "tuplelist.h", "namedict.h", "error.h", "lexer.h"],
 	["obj.h", "codeobject.h", "frame.h"],
 	["gc.h", "vm.h", "ceval.h", "expr.h", "compiler.h", "repl.h"],
-	["_generated.h", "iter.h", "cffi.h", "requests.h", "io.h", "pocketpy.h"]
+	["_generated.h", "iter.h", "base64.h", "cffi.h", "requests.h", "io.h", "pocketpy.h"]
 ]
 
 copied = set()
diff --git a/src/base64.h b/src/base64.h
new file mode 100644
index 00000000..de5b3331
--- /dev/null
+++ b/src/base64.h
@@ -0,0 +1,210 @@
+#pragma once
+
+#include "common.h"
+#include "vm.h"
+
+namespace pkpy {
+
+// https://github.com/zhicheng/base64/blob/master/base64.c
+
+#define BASE64_PAD '='
+#define BASE64DE_FIRST '+'
+#define BASE64DE_LAST 'z'
+
+/* BASE 64 encode table */
+static const char base64en[] = {
+    'A', 'B', 'C', 'D', 'E', 'F', 'G', 'H',
+    'I', 'J', 'K', 'L', 'M', 'N', 'O', 'P',
+    'Q', 'R', 'S', 'T', 'U', 'V', 'W', 'X',
+    'Y', 'Z', 'a', 'b', 'c', 'd', 'e', 'f',
+    'g', 'h', 'i', 'j', 'k', 'l', 'm', 'n',
+    'o', 'p', 'q', 'r', 's', 't', 'u', 'v',
+    'w', 'x', 'y', 'z', '0', '1', '2', '3',
+    '4', '5', '6', '7', '8', '9', '+', '/',
+};
+
+/* ASCII order for BASE 64 decode, 255 in unused character */
+static const unsigned char base64de[] = {
+    /* nul, soh, stx, etx, eot, enq, ack, bel, */
+    255, 255, 255, 255, 255, 255, 255, 255,
+
+    /* bs, ht, nl, vt, np, cr, so, si, */
+    255, 255, 255, 255, 255, 255, 255, 255,
+
+    /* dle, dc1, dc2, dc3, dc4, nak, syn, etb, */
+    255, 255, 255, 255, 255, 255, 255, 255,
+
+    /* can, em, sub, esc, fs, gs, rs, us, */
+    255, 255, 255, 255, 255, 255, 255, 255,
+
+    /* sp, '!', '"', '#', '$', '%', '&', ''', */
+    255, 255, 255, 255, 255, 255, 255, 255,
+
+    /* '(', ')', '*', '+', ',', '-', '.', '/', */
+    255, 255, 255, 62, 255, 255, 255, 63,
+
+    /* '0', '1', '2', '3', '4', '5', '6', '7', */
+    52, 53, 54, 55, 56, 57, 58, 59,
+
+    /* '8', '9', ':', ';', '<', '=', '>', '?', */
+    60, 61, 255, 255, 255, 255, 255, 255,
+
+    /* '@', 'A', 'B', 'C', 'D', 'E', 'F', 'G', */
+    255, 0, 1, 2, 3, 4, 5, 6,
+
+    /* 'H', 'I', 'J', 'K', 'L', 'M', 'N', 'O', */
+    7, 8, 9, 10, 11, 12, 13, 14,
+
+    /* 'P', 'Q', 'R', 'S', 'T', 'U', 'V', 'W', */
+    15, 16, 17, 18, 19, 20, 21, 22,
+
+    /* 'X', 'Y', 'Z', '[', '\', ']', '^', '_', */
+    23, 24, 25, 255, 255, 255, 255, 255,
+
+    /* '`', 'a', 'b', 'c', 'd', 'e', 'f', 'g', */
+    255, 26, 27, 28, 29, 30, 31, 32,
+
+    /* 'h', 'i', 'j', 'k', 'l', 'm', 'n', 'o', */
+    33, 34, 35, 36, 37, 38, 39, 40,
+
+    /* 'p', 'q', 'r', 's', 't', 'u', 'v', 'w', */
+    41, 42, 43, 44, 45, 46, 47, 48,
+
+    /* 'x', 'y', 'z', '{', '|', '}', '~', del, */
+    49, 50, 51, 255, 255, 255, 255, 255
+};
+
+/* Encode `inlen` bytes from `in` as base64 text into `out`.
+ * `out` must have room for 4 * ((inlen + 2) / 3) + 1 chars: every started
+ * 3-byte group yields 4 chars, and a terminating NUL is always written.
+ * Returns the number of chars written, not counting the NUL. */
+inline unsigned int
+base64_encode(const unsigned char *in, unsigned int inlen, char *out)
+{
+    int s;              /* position inside the current 3-byte group (0, 1 or 2) */
+    unsigned int i;
+    unsigned int j;
+    unsigned char c;
+    unsigned char l;    /* previous input byte; carries the bits not yet emitted */
+
+    s = 0;
+    l = 0;
+    for (i = j = 0; i < inlen; i++) {
+        c = in[i];
+
+        switch (s) {
+        case 0:
+            s = 1;
+            out[j++] = base64en[(c >> 2) & 0x3F];
+            break;
+        case 1:
+            s = 2;
+            out[j++] = base64en[((l & 0x3) << 4) | ((c >> 4) & 0xF)];
+            break;
+        case 2:
+            s = 0;
+            out[j++] = base64en[((l & 0xF) << 2) | ((c >> 6) & 0x3)];
+            out[j++] = base64en[c & 0x3F];
+            break;
+        }
+        l = c;
+    }
+
+    /* flush the leftover bits of an incomplete group and pad it to 4 chars */
+    switch (s) {
+    case 1:
+        out[j++] = base64en[(l & 0x3) << 4];
+        out[j++] = BASE64_PAD;
+        out[j++] = BASE64_PAD;
+        break;
+    case 2:
+        out[j++] = base64en[(l & 0xF) << 2];
+        out[j++] = BASE64_PAD;
+        break;
+    }
+
+    out[j] = 0;
+
+    return j;
+}
+
+/* Decode `inlen` base64 chars from `in` into `out`.
+ * At most 3 * inlen / 4 bytes are written to `out`. Decoding stops at the
+ * first '='. Returns the number of bytes written; returns 0 when `inlen`
+ * is not a multiple of 4 or an invalid char is met, which callers cannot
+ * tell apart from decoding an empty input. */
+inline unsigned int
+base64_decode(const char *in, unsigned int inlen, unsigned char *out)
+{
+    unsigned int i;
+    unsigned int j;
+    unsigned char c;
+
+    if (inlen & 0x3) {
+        return 0;
+    }
+
+    for (i = j = 0; i < inlen; i++) {
+        if (in[i] == BASE64_PAD) {
+            break;
+        }
+        /* range check first: keeps the index below inside the 128-entry table */
+        if (in[i] < BASE64DE_FIRST || in[i] > BASE64DE_LAST) {
+            return 0;
+        }
+
+        c = base64de[(unsigned char)in[i]];
+        if (c == 255) {
+            return 0;
+        }
+
+        switch (i & 0x3) {
+        case 0:
+            out[j] = (c << 2) & 0xFF;
+            break;
+        case 1:
+            out[j++] |= (c >> 4) & 0x3;
+            out[j] = (c & 0xF) << 4;
+            break;
+        case 2:
+            out[j++] |= (c >> 2) & 0xF;
+            out[j] = (c & 0x3) << 6;
+            break;
+        case 3:
+            out[j++] |= c;
+            break;
+        }
+    }
+
+    return j;
+}
+
+// Register the built-in `base64` module, exposing b64encode(bytes) and
+// b64decode(bytes); both return a new bytes object.
+inline void add_module_base64(VM* vm){
+    PyObject* mod = vm->new_module("base64");
+
+    // b64encode
+    vm->bind_static_method<1>(mod, "b64encode", [](VM* vm, ArgsView args){
+        Bytes& b = CAST(Bytes&, args[0]);
+        // 4 chars per started 3-byte group, plus the NUL that base64_encode()
+        // always appends; 2 * size would overflow for inputs of 0, 1, 2 or 4 bytes.
+        std::vector<char> out(4 * ((b.size() + 2) / 3) + 1);
+        int size = base64_encode((const unsigned char*)b.data(), b.size(), out.data());
+        out.resize(size);
+        return VAR(Bytes(std::move(out)));
+    });
+
+    // b64decode
+    vm->bind_static_method<1>(mod, "b64decode", [](VM* vm, ArgsView args){
+        Bytes& b = CAST(Bytes&, args[0]);
+        // Decoded data is never longer than its base64 text. NOTE: invalid input
+        // makes base64_decode() return 0, so it currently yields empty bytes.
+        std::vector<char> out(b.size());
+        int size = base64_decode(b.data(), b.size(), (unsigned char*)out.data());
+        out.resize(size);
+        return VAR(Bytes(std::move(out)));
+    });
+}
+
+} // namespace pkpy
\ No newline at end of file
diff --git a/src/pocketpy.h b/src/pocketpy.h
index 6b3f0b45..076d2f47 100644
--- a/src/pocketpy.h
+++ b/src/pocketpy.h
@@ -5,6 +5,7 @@
 #include "obj.h"
 #include "repl.h"
 #include "iter.h"
+#include "base64.h"
 #include "cffi.h"
 #include "requests.h"
 #include "io.h"
@@ -920,6 +921,7 @@ inline void VM::post_init(){
     add_module_c(this);
     add_module_gc(this);
     add_module_random(this);
+    add_module_base64(this);
 
     for(const char* name: {"this", "functools", "collections", "heapq", "bisect"}){
         _lazy_modules[name] = kPythonLibs[name];
diff --git a/tests/70_base64.py b/tests/70_base64.py
new file mode 100644
index 00000000..cf272572
--- /dev/null
+++ b/tests/70_base64.py
@@ -0,0 +1,13 @@
+a = '测试 123'
+a = a.encode()
+
+import base64
+
+b = base64.b64encode(a)
+c = base64.b64decode(b)
+
+assert a == c
+
+# 1- and 2-byte inputs exercise both padding branches of the encoder
+assert base64.b64encode('a'.encode()) == 'YQ=='.encode()
+assert base64.b64encode('ab'.encode()) == 'YWI='.encode()