diff options
| author | Damien George <damien.p.george@gmail.com> | 2019-03-01 14:33:03 +1100 | 
|---|---|---|
| committer | Damien George <damien.p.george@gmail.com> | 2019-03-05 16:32:05 +1100 | 
| commit | 4f0931b21f72be86aae22f05b718aa36792afc9b (patch) | |
| tree | 6ed029f6bc5ef4ee9b125f50e7795220232d5f14 /py | |
| parent | 992a6e1deab06aba07ab09687402d39a0c028a73 (diff) | |
py/persistentcode: Define static qstr set to reduce size of mpy files.
When encoded in the mpy file, if qstr <= QSTR_LAST_STATIC then store two
bytes: 0, static_qstr_id.  Otherwise encode the qstr as usual (either with
string data or a reference into the qstr window).
Reduces mpy file size by about 5%.
Diffstat (limited to 'py')
| -rw-r--r-- | py/makeqstrdata.py | 185 | ||||
| -rw-r--r-- | py/persistentcode.c | 12 | 
2 files changed, 196 insertions, 1 deletions
| diff --git a/py/makeqstrdata.py b/py/makeqstrdata.py index 3c0a60909..060ebb7fd 100644 --- a/py/makeqstrdata.py +++ b/py/makeqstrdata.py @@ -51,6 +51,176 @@ codepoint2name[ord('^')] = 'caret'  codepoint2name[ord('|')] = 'pipe'  codepoint2name[ord('~')] = 'tilde' +# static qstrs, should be sorted + +static_qstr_list = [ +    "", +    "__dir__", # Put __dir__ after empty qstr for builtin dir() to work +    "\n", +    " ", +    "*", +    "/", +    "<module>", +    "_", +    "__call__", +    "__class__", +    "__delitem__", +    "__enter__", +    "__exit__", +    "__getattr__", +    "__getitem__", +    "__hash__", +    "__init__", +    "__int__", +    "__iter__", +    "__len__", +    "__main__", +    "__module__", +    "__name__", +    "__new__", +    "__next__", +    "__qualname__", +    "__repr__", +    "__setitem__", +    "__str__", +    "ArithmeticError", +    "AssertionError", +    "AttributeError", +    "BaseException", +    "EOFError", +    "Ellipsis", +    "Exception", +    "GeneratorExit", +    "ImportError", +    "IndentationError", +    "IndexError", +    "KeyError", +    "KeyboardInterrupt", +    "LookupError", +    "MemoryError", +    "NameError", +    "NoneType", +    "NotImplementedError", +    "OSError", +    "OverflowError", +    "RuntimeError", +    "StopIteration", +    "SyntaxError", +    "SystemExit", +    "TypeError", +    "ValueError", +    "ZeroDivisionError", +    "abs", +    "all", +    "any", +    "append", +    "args", +    "bool", +    "builtins", +    "bytearray", +    "bytecode", +    "bytes", +    "callable", +    "chr", +    "classmethod", +    "clear", +    "close", +    "const", +    "copy", +    "count", +    "dict", +    "dir", +    "divmod", +    "end", +    "endswith", +    "eval", +    "exec", +    "extend", +    "find", +    "format", +    "from_bytes", +    "get", +    "getattr", +    "globals", +    "hasattr", +    "hash", +    "id", +    "index", +    "insert", +    "int", +    "isalpha", +    "isdigit", +    "isinstance", +    "islower", +    "isspace", +    "issubclass", +    "isupper", +    "items", +    "iter", +    "join", +    "key", +    "keys", +    "len", +    "list", +    "little", +    "locals", +    "lower", +    "lstrip", +    "main", +    "map", +    "micropython", +    "next", +    "object", +    "open", +    "ord", +    "pop", +    "popitem", +    "pow", +    "print", +    "range", +    "read", +    "readinto", +    "readline", +    "remove", +    "replace", +    "repr", +    "reverse", +    "rfind", +    "rindex", +    "round", +    "rsplit", +    "rstrip", +    "self", +    "send", +    "sep", +    "set", +    "setattr", +    "setdefault", +    "sort", +    "sorted", +    "split", +    "start", +    "startswith", +    "staticmethod", +    "step", +    "stop", +    "str", +    "strip", +    "sum", +    "super", +    "throw", +    "to_bytes", +    "tuple", +    "type", +    "update", +    "upper", +    "utf-8", +    "value", +    "values", +    "write", +    "zip", +] +  # this must match the equivalent function in qstr.c  def compute_hash(qstr, bytes_hash):      hash = 5381 @@ -70,9 +240,22 @@ def qstr_escape(qst):      return re.sub(r'[^A-Za-z0-9_]', esc_char, qst)  def parse_input_headers(infiles): -    # read the qstrs in from the input files      qcfgs = {}      qstrs = {} + +    # add static qstrs +    for qstr in static_qstr_list: +        # work out the corresponding qstr name +        ident = qstr_escape(qstr) + +        # don't add duplicates +        assert ident not in qstrs + +        # add the qstr to the list, with order number to retain original order in file +        order = len(qstrs) - 300000 +        qstrs[ident] = (order, ident, qstr) + +    # read the qstrs in from the input files      for infile in infiles:          with open(infile, 'rt') as f:              for line in f: diff --git a/py/persistentcode.c b/py/persistentcode.c index d47425db9..c0a328111 100644 --- a/py/persistentcode.c +++ b/py/persistentcode.c @@ -38,6 +38,8 @@  #include "py/smallint.h" +#define QSTR_LAST_STATIC MP_QSTR_zip +  // The current version of .mpy files  #define MPY_VERSION (3) @@ -187,6 +189,10 @@ STATIC size_t read_uint(mp_reader_t *reader, byte **out) {  STATIC qstr load_qstr(mp_reader_t *reader, qstr_window_t *qw) {      size_t len = read_uint(reader, NULL); +    if (len == 0) { +        // static qstr +        return read_byte(reader); +    }      if (len & 1) {          // qstr in window          return qstr_window_access(qw, len >> 1); @@ -362,6 +368,12 @@ STATIC void mp_print_uint(mp_print_t *print, size_t n) {  }  STATIC void save_qstr(mp_print_t *print, qstr_window_t *qw, qstr qst) { +    if (qst <= QSTR_LAST_STATIC) { +        // encode static qstr +        byte buf[2] = {0, qst & 0xff}; +        mp_print_bytes(print, buf, 2); +        return; +    }      size_t idx = qstr_window_insert(qw, qst);      if (idx < QSTR_WINDOW_SIZE) {          // qstr found in window, encode index to it | 
