1 /*
2  * This file is part of the MicroPython project, http://micropython.org/
3  *
4  * The MIT License (MIT)
5  *
6  * Copyright (c) 2013-2020 Damien P. George
7  *
8  * Permission is hereby granted, free of charge, to any person obtaining a copy
9  * of this software and associated documentation files (the "Software"), to deal
10  * in the Software without restriction, including without limitation the rights
11  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
12  * copies of the Software, and to permit persons to whom the Software is
13  * furnished to do so, subject to the following conditions:
14  *
15  * The above copyright notice and this permission notice shall be included in
16  * all copies or substantial portions of the Software.
17  *
18  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
19  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
20  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
21  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
22  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
23  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
24  * THE SOFTWARE.
25  */
26 
27 #include <stdint.h>
28 #include <stdio.h>
29 #include <string.h>
30 #include <assert.h>
31 
32 #include "py/reader.h"
33 #include "py/nativeglue.h"
34 #include "py/persistentcode.h"
35 #include "py/bc0.h"
36 #include "py/objstr.h"
37 #include "py/mpthread.h"
38 
39 #if MICROPY_PERSISTENT_CODE_LOAD || MICROPY_PERSISTENT_CODE_SAVE
40 
41 #include "py/smallint.h"
42 
43 #define QSTR_LAST_STATIC MP_QSTR_zip
44 
45 #if MICROPY_DYNAMIC_COMPILER
46 #define MPY_FEATURE_ARCH_DYNAMIC mp_dynamic_compiler.native_arch
47 #else
48 #define MPY_FEATURE_ARCH_DYNAMIC MPY_FEATURE_ARCH
49 #endif
50 
51 #if MICROPY_PERSISTENT_CODE_LOAD || (MICROPY_PERSISTENT_CODE_SAVE && !MICROPY_DYNAMIC_COMPILER)
52 // The bytecode will depend on the number of bits in a small-int, and
53 // this function computes that (could make it a fixed constant, but it
54 // would need to be defined in mpconfigport.h).
mp_small_int_bits(void)55 STATIC int mp_small_int_bits(void) {
56     mp_int_t i = MP_SMALL_INT_MAX;
57     int n = 1;
58     while (i != 0) {
59         i >>= 1;
60         ++n;
61     }
62     return n;
63 }
64 #endif
65 
66 #define QSTR_WINDOW_SIZE (32)
67 
68 typedef struct _qstr_window_t {
69     uint16_t idx; // indexes the head of the window
70     uint16_t window[QSTR_WINDOW_SIZE];
71 } qstr_window_t;
72 
73 // Push a qstr to the head of the window, and the tail qstr is overwritten
qstr_window_push(qstr_window_t * qw,qstr qst)74 STATIC void qstr_window_push(qstr_window_t *qw, qstr qst) {
75     qw->idx = (qw->idx + 1) % QSTR_WINDOW_SIZE;
76     qw->window[qw->idx] = qst;
77 }
78 
79 // Pull an existing qstr from within the window to the head of the window
qstr_window_pull(qstr_window_t * qw,size_t idx)80 STATIC qstr qstr_window_pull(qstr_window_t *qw, size_t idx) {
81     qstr qst = qw->window[idx];
82     if (idx > qw->idx) {
83         memmove(&qw->window[idx], &qw->window[idx + 1], (QSTR_WINDOW_SIZE - idx - 1) * sizeof(uint16_t));
84         qw->window[QSTR_WINDOW_SIZE - 1] = qw->window[0];
85         idx = 0;
86     }
87     memmove(&qw->window[idx], &qw->window[idx + 1], (qw->idx - idx) * sizeof(uint16_t));
88     qw->window[qw->idx] = qst;
89     return qst;
90 }
91 
92 #if MICROPY_PERSISTENT_CODE_LOAD
93 
94 // Access a qstr at the given index, relative to the head of the window (0=head)
qstr_window_access(qstr_window_t * qw,size_t idx)95 STATIC qstr qstr_window_access(qstr_window_t *qw, size_t idx) {
96     return qstr_window_pull(qw, (qw->idx + QSTR_WINDOW_SIZE - idx) % QSTR_WINDOW_SIZE);
97 }
98 
99 #endif
100 
101 #if MICROPY_PERSISTENT_CODE_SAVE
102 
103 // Insert a qstr at the head of the window, either by pulling an existing one or pushing a new one
qstr_window_insert(qstr_window_t * qw,qstr qst)104 STATIC size_t qstr_window_insert(qstr_window_t *qw, qstr qst) {
105     for (size_t idx = 0; idx < QSTR_WINDOW_SIZE; ++idx) {
106         if (qw->window[idx] == qst) {
107             qstr_window_pull(qw, idx);
108             return (qw->idx + QSTR_WINDOW_SIZE - idx) % QSTR_WINDOW_SIZE;
109         }
110     }
111     qstr_window_push(qw, qst);
112     return QSTR_WINDOW_SIZE;
113 }
114 
115 #endif
116 
117 typedef struct _bytecode_prelude_t {
118     uint n_state;
119     uint n_exc_stack;
120     uint scope_flags;
121     uint n_pos_args;
122     uint n_kwonly_args;
123     uint n_def_pos_args;
124     uint code_info_size;
125 } bytecode_prelude_t;
126 
127 // ip will point to start of opcodes
128 // return value will point to simple_name, source_file qstrs
extract_prelude(const byte ** ip,bytecode_prelude_t * prelude)129 STATIC byte *extract_prelude(const byte **ip, bytecode_prelude_t *prelude) {
130     MP_BC_PRELUDE_SIG_DECODE(*ip);
131     prelude->n_state = n_state;
132     prelude->n_exc_stack = n_exc_stack;
133     prelude->scope_flags = scope_flags;
134     prelude->n_pos_args = n_pos_args;
135     prelude->n_kwonly_args = n_kwonly_args;
136     prelude->n_def_pos_args = n_def_pos_args;
137     MP_BC_PRELUDE_SIZE_DECODE(*ip);
138     byte *ip_info = (byte *)*ip;
139     *ip += n_info;
140     *ip += n_cell;
141     return ip_info;
142 }
143 
144 #endif // MICROPY_PERSISTENT_CODE_LOAD || MICROPY_PERSISTENT_CODE_SAVE
145 
146 #if MICROPY_PERSISTENT_CODE_LOAD
147 
148 #include "py/parsenum.h"
149 
150 STATIC int read_byte(mp_reader_t *reader);
151 STATIC size_t read_uint(mp_reader_t *reader, byte **out);
152 
153 #if MICROPY_EMIT_MACHINE_CODE
154 
155 typedef struct _reloc_info_t {
156     mp_reader_t *reader;
157     mp_uint_t *const_table;
158 } reloc_info_t;
159 
160 #if MICROPY_EMIT_THUMB
asm_thumb_rewrite_mov(uint8_t * pc,uint16_t val)161 STATIC void asm_thumb_rewrite_mov(uint8_t *pc, uint16_t val) {
162     // high part
163     *(uint16_t *)pc = (*(uint16_t *)pc & 0xfbf0) | (val >> 1 & 0x0400) | (val >> 12);
164     // low part
165     *(uint16_t *)(pc + 2) = (*(uint16_t *)(pc + 2) & 0x0f00) | (val << 4 & 0x7000) | (val & 0x00ff);
166 
167 }
168 #endif
169 
arch_link_qstr(uint8_t * pc,bool is_obj,qstr qst)170 STATIC void arch_link_qstr(uint8_t *pc, bool is_obj, qstr qst) {
171     mp_uint_t val = qst;
172     if (is_obj) {
173         val = (mp_uint_t)MP_OBJ_NEW_QSTR(qst);
174     }
175     #if MICROPY_EMIT_X86 || MICROPY_EMIT_X64 || MICROPY_EMIT_ARM || MICROPY_EMIT_XTENSA || MICROPY_EMIT_XTENSAWIN
176     pc[0] = val & 0xff;
177     pc[1] = (val >> 8) & 0xff;
178     pc[2] = (val >> 16) & 0xff;
179     pc[3] = (val >> 24) & 0xff;
180     #elif MICROPY_EMIT_THUMB
181     if (is_obj) {
182         // qstr object, movw and movt
183         asm_thumb_rewrite_mov(pc, val); // movw
184         asm_thumb_rewrite_mov(pc + 4, val >> 16); // movt
185     } else {
186         // qstr number, movw instruction
187         asm_thumb_rewrite_mov(pc, val); // movw
188     }
189     #endif
190 }
191 
mp_native_relocate(void * ri_in,uint8_t * text,uintptr_t reloc_text)192 void mp_native_relocate(void *ri_in, uint8_t *text, uintptr_t reloc_text) {
193     // Relocate native code
194     reloc_info_t *ri = ri_in;
195     uint8_t op;
196     uintptr_t *addr_to_adjust = NULL;
197     while ((op = read_byte(ri->reader)) != 0xff) {
198         if (op & 1) {
199             // Point to new location to make adjustments
200             size_t addr = read_uint(ri->reader, NULL);
201             if ((addr & 1) == 0) {
202                 // Point to somewhere in text
203                 addr_to_adjust = &((uintptr_t *)text)[addr >> 1];
204             } else {
205                 // Point to somewhere in rodata
206                 addr_to_adjust = &((uintptr_t *)ri->const_table[1])[addr >> 1];
207             }
208         }
209         op >>= 1;
210         uintptr_t dest;
211         size_t n = 1;
212         if (op <= 5) {
213             if (op & 1) {
214                 // Read in number of adjustments to make
215                 n = read_uint(ri->reader, NULL);
216             }
217             op >>= 1;
218             if (op == 0) {
219                 // Destination is text
220                 dest = reloc_text;
221             } else {
222                 // Destination is rodata (op=1) or bss (op=1 if no rodata, else op=2)
223                 dest = ri->const_table[op];
224             }
225         } else if (op == 6) {
226             // Destination is mp_fun_table itself
227             dest = (uintptr_t)&mp_fun_table;
228         } else {
229             // Destination is an entry in mp_fun_table
230             dest = ((uintptr_t *)&mp_fun_table)[op - 7];
231         }
232         while (n--) {
233             *addr_to_adjust++ += dest;
234         }
235     }
236 }
237 
238 #endif
239 
read_byte(mp_reader_t * reader)240 STATIC int read_byte(mp_reader_t *reader) {
241     return reader->readbyte(reader->data);
242 }
243 
read_bytes(mp_reader_t * reader,byte * buf,size_t len)244 STATIC void read_bytes(mp_reader_t *reader, byte *buf, size_t len) {
245     while (len-- > 0) {
246         *buf++ = reader->readbyte(reader->data);
247     }
248 }
249 
read_uint(mp_reader_t * reader,byte ** out)250 STATIC size_t read_uint(mp_reader_t *reader, byte **out) {
251     size_t unum = 0;
252     for (;;) {
253         byte b = reader->readbyte(reader->data);
254         if (out != NULL) {
255             **out = b;
256             ++*out;
257         }
258         unum = (unum << 7) | (b & 0x7f);
259         if ((b & 0x80) == 0) {
260             break;
261         }
262     }
263     return unum;
264 }
265 
load_qstr(mp_reader_t * reader,qstr_window_t * qw)266 STATIC qstr load_qstr(mp_reader_t *reader, qstr_window_t *qw) {
267     size_t len = read_uint(reader, NULL);
268     if (len == 0) {
269         // static qstr
270         return read_byte(reader);
271     }
272     if (len & 1) {
273         // qstr in window
274         return qstr_window_access(qw, len >> 1);
275     }
276     len >>= 1;
277     char *str = m_new(char, len);
278     read_bytes(reader, (byte *)str, len);
279     qstr qst = qstr_from_strn(str, len);
280     m_del(char, str, len);
281     qstr_window_push(qw, qst);
282     return qst;
283 }
284 
load_obj(mp_reader_t * reader)285 STATIC mp_obj_t load_obj(mp_reader_t *reader) {
286     byte obj_type = read_byte(reader);
287     if (obj_type == 'e') {
288         return MP_OBJ_FROM_PTR(&mp_const_ellipsis_obj);
289     } else {
290         size_t len = read_uint(reader, NULL);
291         vstr_t vstr;
292         vstr_init_len(&vstr, len);
293         read_bytes(reader, (byte *)vstr.buf, len);
294         if (obj_type == 's' || obj_type == 'b') {
295             return mp_obj_new_str_from_vstr(obj_type == 's' ? &mp_type_str : &mp_type_bytes, &vstr);
296         } else if (obj_type == 'i') {
297             return mp_parse_num_integer(vstr.buf, vstr.len, 10, NULL);
298         } else {
299             assert(obj_type == 'f' || obj_type == 'c');
300             return mp_parse_num_decimal(vstr.buf, vstr.len, obj_type == 'c', false, NULL);
301         }
302     }
303 }
304 
load_prelude_qstrs(mp_reader_t * reader,qstr_window_t * qw,byte * ip)305 STATIC void load_prelude_qstrs(mp_reader_t *reader, qstr_window_t *qw, byte *ip) {
306     qstr simple_name = load_qstr(reader, qw);
307     ip[0] = simple_name;
308     ip[1] = simple_name >> 8;
309     qstr source_file = load_qstr(reader, qw);
310     ip[2] = source_file;
311     ip[3] = source_file >> 8;
312 }
313 
load_prelude(mp_reader_t * reader,qstr_window_t * qw,byte ** ip,bytecode_prelude_t * prelude)314 STATIC void load_prelude(mp_reader_t *reader, qstr_window_t *qw, byte **ip, bytecode_prelude_t *prelude) {
315     // Read in the prelude header
316     byte *ip_read = *ip;
317     read_uint(reader, &ip_read);                    // read in n_state/etc (is effectively a var-uint)
318     read_uint(reader, &ip_read);                    // read in n_info/n_cell (is effectively a var-uint)
319 
320     // Prelude header has been read into *ip, now decode and extract values from it
321     extract_prelude((const byte **)ip, prelude);
322 
323     // Load qstrs in prelude
324     load_prelude_qstrs(reader, qw, ip_read);
325     ip_read += 4;
326 
327     // Read remaining code info
328     read_bytes(reader, ip_read, *ip - ip_read);
329 }
330 
load_bytecode(mp_reader_t * reader,qstr_window_t * qw,byte * ip,byte * ip_top)331 STATIC void load_bytecode(mp_reader_t *reader, qstr_window_t *qw, byte *ip, byte *ip_top) {
332     while (ip < ip_top) {
333         *ip = read_byte(reader);
334         size_t sz;
335         uint f = mp_opcode_format(ip, &sz, false);
336         ++ip;
337         --sz;
338         if (f == MP_BC_FORMAT_QSTR) {
339             qstr qst = load_qstr(reader, qw);
340             *ip++ = qst;
341             *ip++ = qst >> 8;
342             sz -= 2;
343         } else if (f == MP_BC_FORMAT_VAR_UINT) {
344             while ((*ip++ = read_byte(reader)) & 0x80) {
345             }
346         }
347         read_bytes(reader, ip, sz);
348         ip += sz;
349     }
350 }
351 
load_raw_code(mp_reader_t * reader,qstr_window_t * qw)352 STATIC mp_raw_code_t *load_raw_code(mp_reader_t *reader, qstr_window_t *qw) {
353     // Load function kind and data length
354     size_t kind_len = read_uint(reader, NULL);
355     int kind = (kind_len & 3) + MP_CODE_BYTECODE;
356     size_t fun_data_len = kind_len >> 2;
357 
358     #if !MICROPY_EMIT_MACHINE_CODE
359     if (kind != MP_CODE_BYTECODE) {
360         mp_raise_ValueError(MP_ERROR_TEXT("incompatible .mpy file"));
361     }
362     #endif
363 
364     uint8_t *fun_data = NULL;
365     bytecode_prelude_t prelude = {0};
366     #if MICROPY_EMIT_MACHINE_CODE
367     size_t prelude_offset = 0;
368     mp_uint_t type_sig = 0;
369     size_t n_qstr_link = 0;
370     #endif
371 
372     if (kind == MP_CODE_BYTECODE) {
373         // Allocate memory for the bytecode
374         fun_data = m_new(uint8_t, fun_data_len);
375 
376         // Load prelude
377         byte *ip = fun_data;
378         load_prelude(reader, qw, &ip, &prelude);
379 
380         // Load bytecode
381         load_bytecode(reader, qw, ip, fun_data + fun_data_len);
382 
383     #if MICROPY_EMIT_MACHINE_CODE
384     } else {
385         // Allocate memory for native data and load it
386         size_t fun_alloc;
387         MP_PLAT_ALLOC_EXEC(fun_data_len, (void **)&fun_data, &fun_alloc);
388         read_bytes(reader, fun_data, fun_data_len);
389 
390         if (kind == MP_CODE_NATIVE_PY || kind == MP_CODE_NATIVE_VIPER) {
391             // Parse qstr link table and link native code
392             n_qstr_link = read_uint(reader, NULL);
393             for (size_t i = 0; i < n_qstr_link; ++i) {
394                 size_t off = read_uint(reader, NULL);
395                 qstr qst = load_qstr(reader, qw);
396                 uint8_t *dest = fun_data + (off >> 2);
397                 if ((off & 3) == 0) {
398                     // Generic 16-bit link
399                     dest[0] = qst & 0xff;
400                     dest[1] = (qst >> 8) & 0xff;
401                 } else if ((off & 3) == 3) {
402                     // Generic, aligned qstr-object link
403                     *(mp_obj_t *)dest = MP_OBJ_NEW_QSTR(qst);
404                 } else {
405                     // Architecture-specific link
406                     arch_link_qstr(dest, (off & 3) == 2, qst);
407                 }
408             }
409         }
410 
411         if (kind == MP_CODE_NATIVE_PY) {
412             // Extract prelude for later use
413             prelude_offset = read_uint(reader, NULL);
414             const byte *ip = fun_data + prelude_offset;
415             byte *ip_info = extract_prelude(&ip, &prelude);
416             // Load qstrs in prelude
417             load_prelude_qstrs(reader, qw, ip_info);
418         } else {
419             // Load basic scope info for viper and asm
420             prelude.scope_flags = read_uint(reader, NULL);
421             prelude.n_pos_args = 0;
422             prelude.n_kwonly_args = 0;
423             if (kind == MP_CODE_NATIVE_ASM) {
424                 prelude.n_pos_args = read_uint(reader, NULL);
425                 type_sig = read_uint(reader, NULL);
426             }
427         }
428     #endif
429     }
430 
431     size_t n_obj = 0;
432     size_t n_raw_code = 0;
433     mp_uint_t *const_table = NULL;
434 
435     if (kind != MP_CODE_NATIVE_ASM) {
436         // Load constant table for bytecode, native and viper
437 
438         // Number of entries in constant table
439         n_obj = read_uint(reader, NULL);
440         n_raw_code = read_uint(reader, NULL);
441 
442         // Allocate constant table
443         size_t n_alloc = prelude.n_pos_args + prelude.n_kwonly_args + n_obj + n_raw_code;
444         #if MICROPY_EMIT_MACHINE_CODE
445         if (kind != MP_CODE_BYTECODE) {
446             ++n_alloc; // additional entry for mp_fun_table
447             if (prelude.scope_flags & MP_SCOPE_FLAG_VIPERRODATA) {
448                 ++n_alloc; // additional entry for rodata
449             }
450             if (prelude.scope_flags & MP_SCOPE_FLAG_VIPERBSS) {
451                 ++n_alloc; // additional entry for BSS
452             }
453         }
454         #endif
455 
456         const_table = m_new(mp_uint_t, n_alloc);
457         mp_uint_t *ct = const_table;
458 
459         // Load function argument names (initial entries in const_table)
460         // (viper has n_pos_args=n_kwonly_args=0 so doesn't load any qstrs here)
461         for (size_t i = 0; i < prelude.n_pos_args + prelude.n_kwonly_args; ++i) {
462             *ct++ = (mp_uint_t)MP_OBJ_NEW_QSTR(load_qstr(reader, qw));
463         }
464 
465         #if MICROPY_EMIT_MACHINE_CODE
466         if (kind != MP_CODE_BYTECODE) {
467             // Populate mp_fun_table entry
468             *ct++ = (mp_uint_t)(uintptr_t)&mp_fun_table;
469 
470             // Allocate and load rodata if needed
471             if (prelude.scope_flags & MP_SCOPE_FLAG_VIPERRODATA) {
472                 size_t size = read_uint(reader, NULL);
473                 uint8_t *rodata = m_new(uint8_t, size);
474                 read_bytes(reader, rodata, size);
475                 *ct++ = (uintptr_t)rodata;
476             }
477 
478             // Allocate BSS if needed
479             if (prelude.scope_flags & MP_SCOPE_FLAG_VIPERBSS) {
480                 size_t size = read_uint(reader, NULL);
481                 uint8_t *bss = m_new0(uint8_t, size);
482                 *ct++ = (uintptr_t)bss;
483             }
484         }
485         #endif
486 
487         // Load constant objects and raw code children
488         for (size_t i = 0; i < n_obj; ++i) {
489             *ct++ = (mp_uint_t)load_obj(reader);
490         }
491         for (size_t i = 0; i < n_raw_code; ++i) {
492             *ct++ = (mp_uint_t)(uintptr_t)load_raw_code(reader, qw);
493         }
494     }
495 
496     // Create raw_code and return it
497     mp_raw_code_t *rc = mp_emit_glue_new_raw_code();
498     if (kind == MP_CODE_BYTECODE) {
499         // Assign bytecode to raw code object
500         mp_emit_glue_assign_bytecode(rc, fun_data,
501             #if MICROPY_PERSISTENT_CODE_SAVE || MICROPY_DEBUG_PRINTERS
502             fun_data_len,
503             #endif
504             const_table,
505             #if MICROPY_PERSISTENT_CODE_SAVE
506             n_obj, n_raw_code,
507             #endif
508             prelude.scope_flags);
509 
510     #if MICROPY_EMIT_MACHINE_CODE
511     } else {
512         // Relocate and commit code to executable address space
513         reloc_info_t ri = {reader, const_table};
514         #if defined(MP_PLAT_COMMIT_EXEC)
515         void *opt_ri = (prelude.scope_flags & MP_SCOPE_FLAG_VIPERRELOC) ? &ri : NULL;
516         fun_data = MP_PLAT_COMMIT_EXEC(fun_data, fun_data_len, opt_ri);
517         #else
518         if (prelude.scope_flags & MP_SCOPE_FLAG_VIPERRELOC) {
519             #if MICROPY_PERSISTENT_CODE_TRACK_RELOC_CODE
520             // If native code needs relocations then it's not guaranteed that a pointer to
521             // the head of `buf` (containing the machine code) will be retained for the GC
522             // to trace.  This is because native functions can start inside `buf` and so
523             // it's possible that the only GC-reachable pointers are pointers inside `buf`.
524             // So put this `buf` on a list of reachable root pointers.
525             if (MP_STATE_PORT(track_reloc_code_list) == MP_OBJ_NULL) {
526                 MP_STATE_PORT(track_reloc_code_list) = mp_obj_new_list(0, NULL);
527             }
528             mp_obj_list_append(MP_STATE_PORT(track_reloc_code_list), MP_OBJ_FROM_PTR(fun_data));
529             #endif
530             // Do the relocations.
531             mp_native_relocate(&ri, fun_data, (uintptr_t)fun_data);
532         }
533         #endif
534 
535         // Assign native code to raw code object
536         mp_emit_glue_assign_native(rc, kind,
537             fun_data, fun_data_len, const_table,
538             #if MICROPY_PERSISTENT_CODE_SAVE
539             prelude_offset,
540             n_obj, n_raw_code,
541             n_qstr_link, NULL,
542             #endif
543             prelude.n_pos_args, prelude.scope_flags, type_sig);
544     #endif
545     }
546     return rc;
547 }
548 
mp_raw_code_load(mp_reader_t * reader)549 mp_raw_code_t *mp_raw_code_load(mp_reader_t *reader) {
550     byte header[4];
551     read_bytes(reader, header, sizeof(header));
552     if (header[0] != 'M'
553         || header[1] != MPY_VERSION
554         || MPY_FEATURE_DECODE_FLAGS(header[2]) != MPY_FEATURE_FLAGS
555         || header[3] > mp_small_int_bits()
556         || read_uint(reader, NULL) > QSTR_WINDOW_SIZE) {
557         mp_raise_ValueError(MP_ERROR_TEXT("incompatible .mpy file"));
558     }
559     if (MPY_FEATURE_DECODE_ARCH(header[2]) != MP_NATIVE_ARCH_NONE) {
560         byte arch = MPY_FEATURE_DECODE_ARCH(header[2]);
561         if (!MPY_FEATURE_ARCH_TEST(arch)) {
562             mp_raise_ValueError(MP_ERROR_TEXT("incompatible .mpy arch"));
563         }
564     }
565     qstr_window_t qw;
566     qw.idx = 0;
567     mp_raw_code_t *rc = load_raw_code(reader, &qw);
568     reader->close(reader->data);
569     return rc;
570 }
571 
mp_raw_code_load_mem(const byte * buf,size_t len)572 mp_raw_code_t *mp_raw_code_load_mem(const byte *buf, size_t len) {
573     mp_reader_t reader;
574     mp_reader_new_mem(&reader, buf, len, 0);
575     return mp_raw_code_load(&reader);
576 }
577 
578 #if MICROPY_HAS_FILE_READER
579 
mp_raw_code_load_file(const char * filename)580 mp_raw_code_t *mp_raw_code_load_file(const char *filename) {
581     mp_reader_t reader;
582     mp_reader_new_file(&reader, filename);
583     return mp_raw_code_load(&reader);
584 }
585 
586 #endif // MICROPY_HAS_FILE_READER
587 
588 #endif // MICROPY_PERSISTENT_CODE_LOAD
589 
590 #if MICROPY_PERSISTENT_CODE_SAVE
591 
592 #include "py/objstr.h"
593 
mp_print_bytes(mp_print_t * print,const byte * data,size_t len)594 STATIC void mp_print_bytes(mp_print_t *print, const byte *data, size_t len) {
595     print->print_strn(print->data, (const char *)data, len);
596 }
597 
598 #define BYTES_FOR_INT ((MP_BYTES_PER_OBJ_WORD * 8 + 6) / 7)
mp_print_uint(mp_print_t * print,size_t n)599 STATIC void mp_print_uint(mp_print_t *print, size_t n) {
600     byte buf[BYTES_FOR_INT];
601     byte *p = buf + sizeof(buf);
602     *--p = n & 0x7f;
603     n >>= 7;
604     for (; n != 0; n >>= 7) {
605         *--p = 0x80 | (n & 0x7f);
606     }
607     print->print_strn(print->data, (char *)p, buf + sizeof(buf) - p);
608 }
609 
save_qstr(mp_print_t * print,qstr_window_t * qw,qstr qst)610 STATIC void save_qstr(mp_print_t *print, qstr_window_t *qw, qstr qst) {
611     if (qst <= QSTR_LAST_STATIC) {
612         // encode static qstr
613         byte buf[2] = {0, qst & 0xff};
614         mp_print_bytes(print, buf, 2);
615         return;
616     }
617     size_t idx = qstr_window_insert(qw, qst);
618     if (idx < QSTR_WINDOW_SIZE) {
619         // qstr found in window, encode index to it
620         mp_print_uint(print, idx << 1 | 1);
621         return;
622     }
623     size_t len;
624     const byte *str = qstr_data(qst, &len);
625     mp_print_uint(print, len << 1);
626     mp_print_bytes(print, str, len);
627 }
628 
save_obj(mp_print_t * print,mp_obj_t o)629 STATIC void save_obj(mp_print_t *print, mp_obj_t o) {
630     if (mp_obj_is_str_or_bytes(o)) {
631         byte obj_type;
632         if (mp_obj_is_str(o)) {
633             obj_type = 's';
634         } else {
635             obj_type = 'b';
636         }
637         size_t len;
638         const char *str = mp_obj_str_get_data(o, &len);
639         mp_print_bytes(print, &obj_type, 1);
640         mp_print_uint(print, len);
641         mp_print_bytes(print, (const byte *)str, len);
642     } else if (MP_OBJ_TO_PTR(o) == &mp_const_ellipsis_obj) {
643         byte obj_type = 'e';
644         mp_print_bytes(print, &obj_type, 1);
645     } else {
646         // we save numbers using a simplistic text representation
647         // TODO could be improved
648         byte obj_type;
649         if (mp_obj_is_type(o, &mp_type_int)) {
650             obj_type = 'i';
651         #if MICROPY_PY_BUILTINS_COMPLEX
652         } else if (mp_obj_is_type(o, &mp_type_complex)) {
653             obj_type = 'c';
654         #endif
655         } else {
656             assert(mp_obj_is_float(o));
657             obj_type = 'f';
658         }
659         vstr_t vstr;
660         mp_print_t pr;
661         vstr_init_print(&vstr, 10, &pr);
662         mp_obj_print_helper(&pr, o, PRINT_REPR);
663         mp_print_bytes(print, &obj_type, 1);
664         mp_print_uint(print, vstr.len);
665         mp_print_bytes(print, (const byte *)vstr.buf, vstr.len);
666         vstr_clear(&vstr);
667     }
668 }
669 
save_prelude_qstrs(mp_print_t * print,qstr_window_t * qw,const byte * ip)670 STATIC void save_prelude_qstrs(mp_print_t *print, qstr_window_t *qw, const byte *ip) {
671     save_qstr(print, qw, ip[0] | (ip[1] << 8)); // simple_name
672     save_qstr(print, qw, ip[2] | (ip[3] << 8)); // source_file
673 }
674 
save_bytecode(mp_print_t * print,qstr_window_t * qw,const byte * ip,const byte * ip_top)675 STATIC void save_bytecode(mp_print_t *print, qstr_window_t *qw, const byte *ip, const byte *ip_top) {
676     while (ip < ip_top) {
677         size_t sz;
678         uint f = mp_opcode_format(ip, &sz, true);
679         if (f == MP_BC_FORMAT_QSTR) {
680             mp_print_bytes(print, ip, 1);
681             qstr qst = ip[1] | (ip[2] << 8);
682             save_qstr(print, qw, qst);
683             ip += 3;
684             sz -= 3;
685         }
686         mp_print_bytes(print, ip, sz);
687         ip += sz;
688     }
689 }
690 
save_raw_code(mp_print_t * print,mp_raw_code_t * rc,qstr_window_t * qstr_window)691 STATIC void save_raw_code(mp_print_t *print, mp_raw_code_t *rc, qstr_window_t *qstr_window) {
692     // Save function kind and data length
693     mp_print_uint(print, (rc->fun_data_len << 2) | (rc->kind - MP_CODE_BYTECODE));
694 
695     bytecode_prelude_t prelude;
696 
697     if (rc->kind == MP_CODE_BYTECODE) {
698         // Extract prelude
699         const byte *ip = rc->fun_data;
700         const byte *ip_info = extract_prelude(&ip, &prelude);
701 
702         // Save prelude
703         mp_print_bytes(print, rc->fun_data, ip_info - (const byte *)rc->fun_data);
704         save_prelude_qstrs(print, qstr_window, ip_info);
705         ip_info += 4;
706         mp_print_bytes(print, ip_info, ip - ip_info);
707 
708         // Save bytecode
709         const byte *ip_top = (const byte *)rc->fun_data + rc->fun_data_len;
710         save_bytecode(print, qstr_window, ip, ip_top);
711     #if MICROPY_EMIT_MACHINE_CODE
712     } else {
713         // Save native code
714         mp_print_bytes(print, rc->fun_data, rc->fun_data_len);
715 
716         if (rc->kind == MP_CODE_NATIVE_PY || rc->kind == MP_CODE_NATIVE_VIPER) {
717             // Save qstr link table for native code
718             mp_print_uint(print, rc->n_qstr);
719             for (size_t i = 0; i < rc->n_qstr; ++i) {
720                 mp_print_uint(print, rc->qstr_link[i].off);
721                 save_qstr(print, qstr_window, rc->qstr_link[i].qst);
722             }
723         }
724 
725         if (rc->kind == MP_CODE_NATIVE_PY) {
726             // Save prelude size
727             mp_print_uint(print, rc->prelude_offset);
728 
729             // Extract prelude and save qstrs in prelude
730             const byte *ip = (const byte *)rc->fun_data + rc->prelude_offset;
731             const byte *ip_info = extract_prelude(&ip, &prelude);
732             save_prelude_qstrs(print, qstr_window, ip_info);
733         } else {
734             // Save basic scope info for viper and asm
735             mp_print_uint(print, rc->scope_flags & MP_SCOPE_FLAG_ALL_SIG);
736             prelude.n_pos_args = 0;
737             prelude.n_kwonly_args = 0;
738             if (rc->kind == MP_CODE_NATIVE_ASM) {
739                 mp_print_uint(print, rc->n_pos_args);
740                 mp_print_uint(print, rc->type_sig);
741             }
742         }
743     #endif
744     }
745 
746     if (rc->kind != MP_CODE_NATIVE_ASM) {
747         // Save constant table for bytecode, native and viper
748 
749         // Number of entries in constant table
750         mp_print_uint(print, rc->n_obj);
751         mp_print_uint(print, rc->n_raw_code);
752 
753         const mp_uint_t *const_table = rc->const_table;
754 
755         // Save function argument names (initial entries in const_table)
756         // (viper has n_pos_args=n_kwonly_args=0 so doesn't save any qstrs here)
757         for (size_t i = 0; i < prelude.n_pos_args + prelude.n_kwonly_args; ++i) {
758             mp_obj_t o = (mp_obj_t)*const_table++;
759             save_qstr(print, qstr_window, MP_OBJ_QSTR_VALUE(o));
760         }
761 
762         if (rc->kind != MP_CODE_BYTECODE) {
763             // Skip saving mp_fun_table entry
764             ++const_table;
765         }
766 
767         // Save constant objects and raw code children
768         for (size_t i = 0; i < rc->n_obj; ++i) {
769             save_obj(print, (mp_obj_t)*const_table++);
770         }
771         for (size_t i = 0; i < rc->n_raw_code; ++i) {
772             save_raw_code(print, (mp_raw_code_t *)(uintptr_t)*const_table++, qstr_window);
773         }
774     }
775 }
776 
mp_raw_code_has_native(mp_raw_code_t * rc)777 STATIC bool mp_raw_code_has_native(mp_raw_code_t *rc) {
778     if (rc->kind != MP_CODE_BYTECODE) {
779         return true;
780     }
781 
782     const byte *ip = rc->fun_data;
783     bytecode_prelude_t prelude;
784     extract_prelude(&ip, &prelude);
785 
786     const mp_uint_t *const_table = rc->const_table
787         + prelude.n_pos_args + prelude.n_kwonly_args
788         + rc->n_obj;
789 
790     for (size_t i = 0; i < rc->n_raw_code; ++i) {
791         if (mp_raw_code_has_native((mp_raw_code_t *)(uintptr_t)*const_table++)) {
792             return true;
793         }
794     }
795 
796     return false;
797 }
798 
mp_raw_code_save(mp_raw_code_t * rc,mp_print_t * print)799 void mp_raw_code_save(mp_raw_code_t *rc, mp_print_t *print) {
800     // header contains:
801     //  byte  'M'
802     //  byte  version
803     //  byte  feature flags
804     //  byte  number of bits in a small int
805     //  uint  size of qstr window
806     byte header[4] = {
807         'M',
808         MPY_VERSION,
809         MPY_FEATURE_ENCODE_FLAGS(MPY_FEATURE_FLAGS_DYNAMIC),
810         #if MICROPY_DYNAMIC_COMPILER
811         mp_dynamic_compiler.small_int_bits,
812         #else
813         mp_small_int_bits(),
814         #endif
815     };
816     if (mp_raw_code_has_native(rc)) {
817         header[2] |= MPY_FEATURE_ENCODE_ARCH(MPY_FEATURE_ARCH_DYNAMIC);
818     }
819     mp_print_bytes(print, header, sizeof(header));
820     mp_print_uint(print, QSTR_WINDOW_SIZE);
821 
822     qstr_window_t qw;
823     qw.idx = 0;
824     memset(qw.window, 0, sizeof(qw.window));
825     save_raw_code(print, rc, &qw);
826 }
827 
828 #if MICROPY_PERSISTENT_CODE_SAVE_FILE
829 
830 #include <unistd.h>
831 #include <sys/stat.h>
832 #include <fcntl.h>
833 
fd_print_strn(void * env,const char * str,size_t len)834 STATIC void fd_print_strn(void *env, const char *str, size_t len) {
835     int fd = (intptr_t)env;
836     MP_THREAD_GIL_EXIT();
837     ssize_t ret = write(fd, str, len);
838     MP_THREAD_GIL_ENTER();
839     (void)ret;
840 }
841 
mp_raw_code_save_file(mp_raw_code_t * rc,const char * filename)842 void mp_raw_code_save_file(mp_raw_code_t *rc, const char *filename) {
843     MP_THREAD_GIL_EXIT();
844     int fd = open(filename, O_WRONLY | O_CREAT | O_TRUNC, 0644);
845     MP_THREAD_GIL_ENTER();
846     mp_print_t fd_print = {(void *)(intptr_t)fd, fd_print_strn};
847     mp_raw_code_save(rc, &fd_print);
848     MP_THREAD_GIL_EXIT();
849     close(fd);
850     MP_THREAD_GIL_ENTER();
851 }
852 
853 #endif // MICROPY_PERSISTENT_CODE_SAVE_FILE
854 
855 #endif // MICROPY_PERSISTENT_CODE_SAVE
856