blob: 35f5f8243eebaa0ef5c0e0093108fb08b23c1b83 [file] [log] [blame]
Damien George04b91472014-05-03 23:27:38 +01001/*
2 * This file is part of the Micro Python project, http://micropython.org/
3 *
4 * The MIT License (MIT)
5 *
Damien George4735c452015-04-21 16:43:18 +00006 * Copyright (c) 2013-2015 Damien P. George
Damien George04b91472014-05-03 23:27:38 +01007 *
8 * Permission is hereby granted, free of charge, to any person obtaining a copy
9 * of this software and associated documentation files (the "Software"), to deal
10 * in the Software without restriction, including without limitation the rights
11 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
12 * copies of the Software, and to permit persons to whom the Software is
13 * furnished to do so, subject to the following conditions:
14 *
15 * The above copyright notice and this permission notice shall be included in
16 * all copies or substantial portions of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
19 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
20 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
21 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
22 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
23 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
24 * THE SOFTWARE.
25 */
26
xbeefe34222014-03-16 00:14:26 -070027#include <stdbool.h>
Damien429d7192013-10-04 19:53:11 +010028#include <stdint.h>
29#include <stdio.h>
Damien429d7192013-10-04 19:53:11 +010030#include <assert.h>
Damien George5042bce2014-05-25 22:06:06 +010031#include <string.h>
Damien429d7192013-10-04 19:53:11 +010032
Damien George0bfc7632015-02-07 18:33:58 +000033#include "py/nlr.h"
Damien George51dfcb42015-01-01 20:27:54 +000034#include "py/lexer.h"
35#include "py/parse.h"
36#include "py/parsenum.h"
37#include "py/smallint.h"
Damien429d7192013-10-04 19:53:11 +010038
// Bit layout of rule_t.act:
//   bits 0-3  (RULE_ACT_ARG_MASK)  numeric argument of the rule kind
//   bits 4-5  (RULE_ACT_KIND_MASK) rule kind: RULE_ACT_OR, RULE_ACT_AND or RULE_ACT_LIST
//   bit  6    RULE_ACT_ALLOW_IDENT flag
//   bit  7    RULE_ACT_ADD_BLANK flag
Damien429d7192013-10-04 19:53:11 +010039#define RULE_ACT_ARG_MASK (0x0f)
Damien Georgeb47ea4e2014-12-20 18:37:50 +000040#define RULE_ACT_KIND_MASK (0x30)
41#define RULE_ACT_ALLOW_IDENT (0x40)
42#define RULE_ACT_ADD_BLANK (0x80)
Damien429d7192013-10-04 19:53:11 +010043#define RULE_ACT_OR (0x10)
44#define RULE_ACT_AND (0x20)
45#define RULE_ACT_LIST (0x30)
46
// Bit layout of each rule_t.arg[] entry:
//   bits 12-15 (RULE_ARG_KIND_MASK) argument kind: token, rule or optional rule
//   bits 0-11  (RULE_ARG_ARG_MASK)  the token kind or rule id being referenced
Damien429d7192013-10-04 19:53:11 +010047#define RULE_ARG_KIND_MASK (0xf000)
48#define RULE_ARG_ARG_MASK (0x0fff)
49#define RULE_ARG_TOK (0x1000)
50#define RULE_ARG_RULE (0x2000)
Damien George4735c452015-04-21 16:43:18 +000051#define RULE_ARG_OPT_RULE (0x3000)
Damien429d7192013-10-04 19:53:11 +010052
// Evaluates to true when `rule` (a pointer to a rule_t) has the
// RULE_ACT_ADD_BLANK flag set in its act byte.  The argument is parenthesised
// so that any pointer-valued expression (e.g. `p + 1`) expands correctly.
#define ADD_BLANK_NODE(rule) (((rule)->act & RULE_ACT_ADD_BLANK) != 0)
Damien Georgeb829b5c2014-01-25 13:51:19 +000054
Damien429d7192013-10-04 19:53:11 +010055// (un)comment to use rule names; for debugging
56//#define USE_RULE_NAME (1)
57
// Static description of one grammar rule, instantiated once per DEF_RULE entry.
58typedef struct _rule_t {
// RULE_xxx id of this rule; used as the index into rules[].
59 byte rule_id;
// Rule kind, numeric argument and flags, packed according to the RULE_ACT_* masks.
60 byte act;
61#ifdef USE_RULE_NAME
// Rule name as a string; only present in debugging builds.
62 const char *rule_name;
63#endif
// Rule arguments; each entry is a RULE_ARG_* kind or'd with a token kind or rule id.
64 uint16_t arg[];
65} rule_t;
66
// Rule ids: one RULE_<name> constant per DEF_RULE entry of py/grammar.h, in
// the order they appear there, followed by ids for special struct nodes.
67enum {
Damien George00208ce2014-01-23 00:00:53 +000068#define DEF_RULE(rule, comp, kind, ...) RULE_##rule,
Damien George51dfcb42015-01-01 20:27:54 +000069#include "py/grammar.h"
Damien429d7192013-10-04 19:53:11 +010070#undef DEF_RULE
// Number of grammar rules; the ids after this one have no entry in rules[].
71 RULE_maximum_number_of,
Damien George5042bce2014-05-25 22:06:06 +010072 RULE_string, // special node for non-interned string
Damien George4c81ba82015-01-13 16:21:23 +000073 RULE_bytes, // special node for non-interned bytes
Damien George7d414a12015-02-08 01:57:40 +000074 RULE_const_object, // special node for a constant, generic Python object
Damien429d7192013-10-04 19:53:11 +010075};
76
// Helper macros available while py/grammar.h is included below.  They build
// the act byte (ident, blank, or, and, one_or_more, list, list_with_end) and
// the arg[] entries (tok, rule, opt_rule) of each rule.
// NOTE(review): `ident` and `blank` are not #undef'd after the include, unlike
// the other helpers -- confirm whether that is intentional.
Damien Georgeb47ea4e2014-12-20 18:37:50 +000077#define ident (RULE_ACT_ALLOW_IDENT)
78#define blank (RULE_ACT_ADD_BLANK)
Damien429d7192013-10-04 19:53:11 +010079#define or(n) (RULE_ACT_OR | n)
80#define and(n) (RULE_ACT_AND | n)
81#define one_or_more (RULE_ACT_LIST | 2)
82#define list (RULE_ACT_LIST | 1)
83#define list_with_end (RULE_ACT_LIST | 3)
Damiend99b0522013-12-21 18:17:45 +000084#define tok(t) (RULE_ARG_TOK | MP_TOKEN_##t)
Damien429d7192013-10-04 19:53:11 +010085#define rule(r) (RULE_ARG_RULE | RULE_##r)
Damien429d7192013-10-04 19:53:11 +010086#define opt_rule(r) (RULE_ARG_OPT_RULE | RULE_##r)
// Each DEF_RULE expands to a `static const rule_t rule_<name>` object; the
// rule name string is stored only when USE_RULE_NAME is defined.
87#ifdef USE_RULE_NAME
Damien George00208ce2014-01-23 00:00:53 +000088#define DEF_RULE(rule, comp, kind, ...) static const rule_t rule_##rule = { RULE_##rule, kind, #rule, { __VA_ARGS__ } };
Damien429d7192013-10-04 19:53:11 +010089#else
Damien George00208ce2014-01-23 00:00:53 +000090#define DEF_RULE(rule, comp, kind, ...) static const rule_t rule_##rule = { RULE_##rule, kind, { __VA_ARGS__ } };
Damien429d7192013-10-04 19:53:11 +010091#endif
Damien George51dfcb42015-01-01 20:27:54 +000092#include "py/grammar.h"
Damien429d7192013-10-04 19:53:11 +010093#undef or
94#undef and
95#undef list
96#undef list_with_end
97#undef tok
98#undef rule
Damien429d7192013-10-04 19:53:11 +010099#undef opt_rule
100#undef one_or_more
101#undef DEF_RULE
102
// Table of pointers to every rule_<name> object, generated in the same
// DEF_RULE order as the RULE_<name> enum so it can be indexed by rule id.
Paul Sokolovsky520e2f52014-02-12 18:31:30 +0200103STATIC const rule_t *rules[] = {
Damien George00208ce2014-01-23 00:00:53 +0000104#define DEF_RULE(rule, comp, kind, ...) &rule_##rule,
Damien George51dfcb42015-01-01 20:27:54 +0000105#include "py/grammar.h"
Damien429d7192013-10-04 19:53:11 +0100106#undef DEF_RULE
107};
108
// One entry of the parser's rule stack: the rule to resume (by id), the
// argument index to resume at, and the source line recorded for that rule.
109typedef struct _rule_stack_t {
Damien George5c670ac2015-01-24 23:12:58 +0000110 mp_uint_t src_line : BITS_PER_WORD - 8; // maximum bits storing source line number
111 mp_uint_t rule_id : 8; // this must be large enough to fit largest rule number
112 mp_uint_t arg_i; // this dictates the maximum nodes in a "list" of things
Damien429d7192013-10-04 19:53:11 +0100113} rule_stack_t;
114
// Complete state of one parse: an error flag, the two growable stacks and
// the lexer that supplies tokens.
115typedef struct _parser_t {
// Set by memory_error(); once set, the push/pop helpers become no-ops.
Damien George58ba4c32014-04-10 14:27:31 +0000116 bool had_memory_error;
117
// Rule stack: allocated capacity, number of entries in use, and storage.
Damien George38161822014-07-03 14:13:33 +0100118 mp_uint_t rule_stack_alloc;
119 mp_uint_t rule_stack_top;
Damien429d7192013-10-04 19:53:11 +0100120 rule_stack_t *rule_stack;
121
// Result stack of parse nodes: allocated capacity, entries in use, and storage.
Damien George38161822014-07-03 14:13:33 +0100122 mp_uint_t result_stack_alloc;
123 mp_uint_t result_stack_top;
Damiend99b0522013-12-21 18:17:45 +0000124 mp_parse_node_t *result_stack;
Damien George08335002014-01-18 23:24:36 +0000125
// Lexer whose current token (tok_kind, tok_line, vstr) the parser reads.
126 mp_lexer_t *lexer;
Damien429d7192013-10-04 19:53:11 +0100127} parser_t;
128
Damien George58ba4c32014-04-10 14:27:31 +0000129STATIC inline void memory_error(parser_t *parser) {
130 parser->had_memory_error = true;
131}
132
Damien George38161822014-07-03 14:13:33 +0100133STATIC void push_rule(parser_t *parser, mp_uint_t src_line, const rule_t *rule, mp_uint_t arg_i) {
Damien George58ba4c32014-04-10 14:27:31 +0000134 if (parser->had_memory_error) {
135 return;
136 }
Damien429d7192013-10-04 19:53:11 +0100137 if (parser->rule_stack_top >= parser->rule_stack_alloc) {
Damien George58ebde42014-05-21 20:32:59 +0100138 rule_stack_t *rs = m_renew_maybe(rule_stack_t, parser->rule_stack, parser->rule_stack_alloc, parser->rule_stack_alloc + MICROPY_ALLOC_PARSE_RULE_INC);
Damien George58ba4c32014-04-10 14:27:31 +0000139 if (rs == NULL) {
140 memory_error(parser);
141 return;
142 }
143 parser->rule_stack = rs;
Damien George58ebde42014-05-21 20:32:59 +0100144 parser->rule_stack_alloc += MICROPY_ALLOC_PARSE_RULE_INC;
Damien429d7192013-10-04 19:53:11 +0100145 }
Damien George08335002014-01-18 23:24:36 +0000146 rule_stack_t *rs = &parser->rule_stack[parser->rule_stack_top++];
147 rs->src_line = src_line;
148 rs->rule_id = rule->rule_id;
149 rs->arg_i = arg_i;
Damien429d7192013-10-04 19:53:11 +0100150}
151
Damien George38161822014-07-03 14:13:33 +0100152STATIC void push_rule_from_arg(parser_t *parser, mp_uint_t arg) {
Damien429d7192013-10-04 19:53:11 +0100153 assert((arg & RULE_ARG_KIND_MASK) == RULE_ARG_RULE || (arg & RULE_ARG_KIND_MASK) == RULE_ARG_OPT_RULE);
Damien George38161822014-07-03 14:13:33 +0100154 mp_uint_t rule_id = arg & RULE_ARG_ARG_MASK;
Damien429d7192013-10-04 19:53:11 +0100155 assert(rule_id < RULE_maximum_number_of);
Damien Georgea4c52c52014-12-05 19:35:18 +0000156 push_rule(parser, parser->lexer->tok_line, rules[rule_id], 0);
Damien429d7192013-10-04 19:53:11 +0100157}
158
Damien George38161822014-07-03 14:13:33 +0100159STATIC void pop_rule(parser_t *parser, const rule_t **rule, mp_uint_t *arg_i, mp_uint_t *src_line) {
Damien George58ba4c32014-04-10 14:27:31 +0000160 assert(!parser->had_memory_error);
Damien429d7192013-10-04 19:53:11 +0100161 parser->rule_stack_top -= 1;
162 *rule = rules[parser->rule_stack[parser->rule_stack_top].rule_id];
163 *arg_i = parser->rule_stack[parser->rule_stack_top].arg_i;
Damien George08335002014-01-18 23:24:36 +0000164 *src_line = parser->rule_stack[parser->rule_stack_top].src_line;
Damien429d7192013-10-04 19:53:11 +0100165}
166
Damien George40f3c022014-07-03 13:25:24 +0100167mp_parse_node_t mp_parse_node_new_leaf(mp_int_t kind, mp_int_t arg) {
Paul Sokolovsky56e5ef22014-02-22 16:39:45 +0200168 if (kind == MP_PARSE_NODE_SMALL_INT) {
169 return (mp_parse_node_t)(kind | (arg << 1));
170 }
Damien George7d414a12015-02-08 01:57:40 +0000171 return (mp_parse_node_t)(kind | (arg << 4));
Damien429d7192013-10-04 19:53:11 +0100172}
173
Damien George5042bce2014-05-25 22:06:06 +0100174void mp_parse_node_free(mp_parse_node_t pn) {
Damien Georgeb829b5c2014-01-25 13:51:19 +0000175 if (MP_PARSE_NODE_IS_STRUCT(pn)) {
176 mp_parse_node_struct_t *pns = (mp_parse_node_struct_t *)pn;
Damien George38161822014-07-03 14:13:33 +0100177 mp_uint_t n = MP_PARSE_NODE_STRUCT_NUM_NODES(pns);
178 mp_uint_t rule_id = MP_PARSE_NODE_STRUCT_KIND(pns);
Damien George4c81ba82015-01-13 16:21:23 +0000179 if (rule_id == RULE_string || rule_id == RULE_bytes) {
Damien George52b5d762014-09-23 15:31:56 +0000180 m_del(char, (char*)pns->nodes[0], (mp_uint_t)pns->nodes[1]);
Damien George7d414a12015-02-08 01:57:40 +0000181 } else if (rule_id == RULE_const_object) {
182 // don't free the const object since it's probably used by the compiled code
Damien Georgee7bb0442014-10-23 14:13:05 +0100183 } else {
Damien Georgeb47ea4e2014-12-20 18:37:50 +0000184 bool adjust = ADD_BLANK_NODE(rules[rule_id]);
Damien Georgee7bb0442014-10-23 14:13:05 +0100185 if (adjust) {
186 n--;
187 }
188 for (mp_uint_t i = 0; i < n; i++) {
189 mp_parse_node_free(pns->nodes[i]);
190 }
191 if (adjust) {
192 n++;
193 }
Damien Georgeb829b5c2014-01-25 13:51:19 +0000194 }
195 m_del_var(mp_parse_node_struct_t, mp_parse_node_t, n, pns);
Paul Sokolovskyaee2ba72014-01-25 00:56:19 +0200196 }
Paul Sokolovskyaee2ba72014-01-25 00:56:19 +0200197}
198
Damien Georgedfe944c2015-02-13 02:29:46 +0000199int mp_parse_node_extract_list(mp_parse_node_t *pn, mp_uint_t pn_kind, mp_parse_node_t **nodes) {
200 if (MP_PARSE_NODE_IS_NULL(*pn)) {
201 *nodes = NULL;
202 return 0;
203 } else if (MP_PARSE_NODE_IS_LEAF(*pn)) {
204 *nodes = pn;
205 return 1;
206 } else {
207 mp_parse_node_struct_t *pns = (mp_parse_node_struct_t*)(*pn);
208 if (MP_PARSE_NODE_STRUCT_KIND(pns) != pn_kind) {
209 *nodes = pn;
210 return 1;
211 } else {
212 *nodes = pns->nodes;
213 return MP_PARSE_NODE_STRUCT_NUM_NODES(pns);
214 }
215 }
216}
217
#if MICROPY_DEBUG_PRINTERS
// Debug helper: print the parse tree rooted at `pn` to stdout, one node per
// line.  Struct nodes are prefixed with their source line number, and each
// level of children is printed with `indent` increased by 2.
void mp_parse_node_print(mp_parse_node_t pn, mp_uint_t indent) {
    if (MP_PARSE_NODE_IS_STRUCT(pn)) {
        printf("[% 4d] ", (int)((mp_parse_node_struct_t*)pn)->source_line);
    } else {
        printf(" ");
    }
    for (mp_uint_t i = 0; i < indent; i++) {
        printf(" ");
    }
    if (MP_PARSE_NODE_IS_NULL(pn)) {
        printf("NULL\n");
    } else if (MP_PARSE_NODE_IS_SMALL_INT(pn)) {
        mp_int_t arg = MP_PARSE_NODE_LEAF_SMALL_INT(pn);
        printf("int(" INT_FMT ")\n", arg);
    } else if (MP_PARSE_NODE_IS_LEAF(pn)) {
        mp_uint_t arg = MP_PARSE_NODE_LEAF_ARG(pn);
        switch (MP_PARSE_NODE_LEAF_KIND(pn)) {
            case MP_PARSE_NODE_ID: printf("id(%s)\n", qstr_str(arg)); break;
            case MP_PARSE_NODE_STRING: printf("str(%s)\n", qstr_str(arg)); break;
            case MP_PARSE_NODE_BYTES: printf("bytes(%s)\n", qstr_str(arg)); break;
            // arg is unsigned, so print it with the unsigned format like the
            // other mp_uint_t values in this function
            case MP_PARSE_NODE_TOKEN: printf("tok(" UINT_FMT ")\n", arg); break;
            default: assert(0);
        }
    } else {
        // node must be a mp_parse_node_struct_t
        mp_parse_node_struct_t *pns = (mp_parse_node_struct_t*)pn;
        if (MP_PARSE_NODE_STRUCT_KIND(pns) == RULE_string) {
            // nodes[0] is the character data, nodes[1] its length
            printf("literal str(%.*s)\n", (int)pns->nodes[1], (char*)pns->nodes[0]);
        } else if (MP_PARSE_NODE_STRUCT_KIND(pns) == RULE_bytes) {
            printf("literal bytes(%.*s)\n", (int)pns->nodes[1], (char*)pns->nodes[0]);
        } else if (MP_PARSE_NODE_STRUCT_KIND(pns) == RULE_const_object) {
            printf("literal const(%p)\n", (mp_obj_t)pns->nodes[0]);
        } else {
            mp_uint_t n = MP_PARSE_NODE_STRUCT_NUM_NODES(pns);
#ifdef USE_RULE_NAME
            printf("%s(" UINT_FMT ") (n=" UINT_FMT ")\n", rules[MP_PARSE_NODE_STRUCT_KIND(pns)]->rule_name, (mp_uint_t)MP_PARSE_NODE_STRUCT_KIND(pns), n);
#else
            printf("rule(" UINT_FMT ") (n=" UINT_FMT ")\n", (mp_uint_t)MP_PARSE_NODE_STRUCT_KIND(pns), n);
#endif
            for (mp_uint_t i = 0; i < n; i++) {
                mp_parse_node_print(pns->nodes[i], indent + 2);
            }
        }
    }
}
#endif // MICROPY_DEBUG_PRINTERS
Damien429d7192013-10-04 19:53:11 +0100265
266/*
Paul Sokolovsky520e2f52014-02-12 18:31:30 +0200267STATIC void result_stack_show(parser_t *parser) {
Damien429d7192013-10-04 19:53:11 +0100268 printf("result stack, most recent first\n");
Damien George38161822014-07-03 14:13:33 +0100269 for (mp_int_t i = parser->result_stack_top - 1; i >= 0; i--) {
Damien Georgecbd2f742014-01-19 11:48:48 +0000270 mp_parse_node_print(parser->result_stack[i], 0);
Damien429d7192013-10-04 19:53:11 +0100271 }
272}
273*/
274
Paul Sokolovsky520e2f52014-02-12 18:31:30 +0200275STATIC mp_parse_node_t pop_result(parser_t *parser) {
Damien George58ba4c32014-04-10 14:27:31 +0000276 if (parser->had_memory_error) {
277 return MP_PARSE_NODE_NULL;
278 }
Damien429d7192013-10-04 19:53:11 +0100279 assert(parser->result_stack_top > 0);
280 return parser->result_stack[--parser->result_stack_top];
281}
282
Damien George38161822014-07-03 14:13:33 +0100283STATIC mp_parse_node_t peek_result(parser_t *parser, mp_uint_t pos) {
Damien George58ba4c32014-04-10 14:27:31 +0000284 if (parser->had_memory_error) {
285 return MP_PARSE_NODE_NULL;
286 }
Damien429d7192013-10-04 19:53:11 +0100287 assert(parser->result_stack_top > pos);
288 return parser->result_stack[parser->result_stack_top - 1 - pos];
289}
290
Paul Sokolovsky520e2f52014-02-12 18:31:30 +0200291STATIC void push_result_node(parser_t *parser, mp_parse_node_t pn) {
Damien George58ba4c32014-04-10 14:27:31 +0000292 if (parser->had_memory_error) {
293 return;
294 }
Damien George69a818d2014-01-12 13:55:24 +0000295 if (parser->result_stack_top >= parser->result_stack_alloc) {
Damien George50912e72015-01-20 11:55:10 +0000296 mp_parse_node_t *stack = m_renew_maybe(mp_parse_node_t, parser->result_stack, parser->result_stack_alloc, parser->result_stack_alloc + MICROPY_ALLOC_PARSE_RESULT_INC);
297 if (stack == NULL) {
Damien George58ba4c32014-04-10 14:27:31 +0000298 memory_error(parser);
299 return;
300 }
Damien George50912e72015-01-20 11:55:10 +0000301 parser->result_stack = stack;
Damien George58ebde42014-05-21 20:32:59 +0100302 parser->result_stack_alloc += MICROPY_ALLOC_PARSE_RESULT_INC;
Damien George69a818d2014-01-12 13:55:24 +0000303 }
Damien429d7192013-10-04 19:53:11 +0100304 parser->result_stack[parser->result_stack_top++] = pn;
305}
306
Damien George7d414a12015-02-08 01:57:40 +0000307STATIC mp_parse_node_t make_node_string_bytes(parser_t *parser, mp_uint_t src_line, mp_uint_t rule_kind, const char *str, mp_uint_t len) {
Damien George5042bce2014-05-25 22:06:06 +0100308 mp_parse_node_struct_t *pn = m_new_obj_var_maybe(mp_parse_node_struct_t, mp_parse_node_t, 2);
309 if (pn == NULL) {
310 memory_error(parser);
Damien George7d414a12015-02-08 01:57:40 +0000311 return MP_PARSE_NODE_NULL;
Damien George5042bce2014-05-25 22:06:06 +0100312 }
313 pn->source_line = src_line;
Damien George4c81ba82015-01-13 16:21:23 +0000314 pn->kind_num_nodes = rule_kind | (2 << 8);
Damien George5042bce2014-05-25 22:06:06 +0100315 char *p = m_new(char, len);
316 memcpy(p, str, len);
Damien George40f3c022014-07-03 13:25:24 +0100317 pn->nodes[0] = (mp_int_t)p;
Damien George5042bce2014-05-25 22:06:06 +0100318 pn->nodes[1] = len;
Damien George7d414a12015-02-08 01:57:40 +0000319 return (mp_parse_node_t)pn;
320}
321
322STATIC mp_parse_node_t make_node_const_object(parser_t *parser, mp_uint_t src_line, mp_obj_t obj) {
323 mp_parse_node_struct_t *pn = m_new_obj_var_maybe(mp_parse_node_struct_t, mp_parse_node_t, 1);
324 if (pn == NULL) {
325 memory_error(parser);
326 return MP_PARSE_NODE_NULL;
327 }
328 pn->source_line = src_line;
329 pn->kind_num_nodes = RULE_const_object | (1 << 8);
330 pn->nodes[0] = (mp_uint_t)obj;
331 return (mp_parse_node_t)pn;
Damien George5042bce2014-05-25 22:06:06 +0100332}
Paul Sokolovsky9e76b112014-05-08 22:43:46 +0300333
Damien Georgea4c52c52014-12-05 19:35:18 +0000334STATIC void push_result_token(parser_t *parser) {
Damiend99b0522013-12-21 18:17:45 +0000335 mp_parse_node_t pn;
Damien Georgea4c52c52014-12-05 19:35:18 +0000336 mp_lexer_t *lex = parser->lexer;
337 if (lex->tok_kind == MP_TOKEN_NAME) {
338 pn = mp_parse_node_new_leaf(MP_PARSE_NODE_ID, qstr_from_strn(lex->vstr.buf, lex->vstr.len));
Damien George7d414a12015-02-08 01:57:40 +0000339 } else if (lex->tok_kind == MP_TOKEN_INTEGER) {
340 mp_obj_t o = mp_parse_num_integer(lex->vstr.buf, lex->vstr.len, 0, lex);
341 if (MP_OBJ_IS_SMALL_INT(o)) {
342 pn = mp_parse_node_new_leaf(MP_PARSE_NODE_SMALL_INT, MP_OBJ_SMALL_INT_VALUE(o));
Damien429d7192013-10-04 19:53:11 +0100343 } else {
Damien George7d414a12015-02-08 01:57:40 +0000344 pn = make_node_const_object(parser, lex->tok_line, o);
Damien429d7192013-10-04 19:53:11 +0100345 }
Damien George7d414a12015-02-08 01:57:40 +0000346 } else if (lex->tok_kind == MP_TOKEN_FLOAT_OR_IMAG) {
347 mp_obj_t o = mp_parse_num_decimal(lex->vstr.buf, lex->vstr.len, true, false, lex);
348 pn = make_node_const_object(parser, lex->tok_line, o);
Damien George4c81ba82015-01-13 16:21:23 +0000349 } else if (lex->tok_kind == MP_TOKEN_STRING || lex->tok_kind == MP_TOKEN_BYTES) {
350 // Don't automatically intern all strings/bytes. doc strings (which are usually large)
Damien George5042bce2014-05-25 22:06:06 +0100351 // will be discarded by the compiler, and so we shouldn't intern them.
352 qstr qst = MP_QSTR_NULL;
Damien Georgea4c52c52014-12-05 19:35:18 +0000353 if (lex->vstr.len <= MICROPY_ALLOC_PARSE_INTERN_STRING_LEN) {
Damien George5042bce2014-05-25 22:06:06 +0100354 // intern short strings
Damien Georgea4c52c52014-12-05 19:35:18 +0000355 qst = qstr_from_strn(lex->vstr.buf, lex->vstr.len);
Damien George5042bce2014-05-25 22:06:06 +0100356 } else {
357 // check if this string is already interned
Damien Georgea4c52c52014-12-05 19:35:18 +0000358 qst = qstr_find_strn(lex->vstr.buf, lex->vstr.len);
Damien George5042bce2014-05-25 22:06:06 +0100359 }
360 if (qst != MP_QSTR_NULL) {
361 // qstr exists, make a leaf node
Damien George4c81ba82015-01-13 16:21:23 +0000362 pn = mp_parse_node_new_leaf(lex->tok_kind == MP_TOKEN_STRING ? MP_PARSE_NODE_STRING : MP_PARSE_NODE_BYTES, qst);
Damien George5042bce2014-05-25 22:06:06 +0100363 } else {
Damien George4c81ba82015-01-13 16:21:23 +0000364 // not interned, make a node holding a pointer to the string/bytes data
Damien George7d414a12015-02-08 01:57:40 +0000365 pn = make_node_string_bytes(parser, lex->tok_line, lex->tok_kind == MP_TOKEN_STRING ? RULE_string : RULE_bytes, lex->vstr.buf, lex->vstr.len);
Damien George5042bce2014-05-25 22:06:06 +0100366 }
Damien429d7192013-10-04 19:53:11 +0100367 } else {
Damien Georgea4c52c52014-12-05 19:35:18 +0000368 pn = mp_parse_node_new_leaf(MP_PARSE_NODE_TOKEN, lex->tok_kind);
Damien429d7192013-10-04 19:53:11 +0100369 }
370 push_result_node(parser, pn);
371}
372
Damien George38161822014-07-03 14:13:33 +0100373STATIC void push_result_rule(parser_t *parser, mp_uint_t src_line, const rule_t *rule, mp_uint_t num_args) {
Damien George58ba4c32014-04-10 14:27:31 +0000374 mp_parse_node_struct_t *pn = m_new_obj_var_maybe(mp_parse_node_struct_t, mp_parse_node_t, num_args);
375 if (pn == NULL) {
376 memory_error(parser);
377 return;
378 }
379 pn->source_line = src_line;
380 pn->kind_num_nodes = (rule->rule_id & 0xff) | (num_args << 8);
Damien George38161822014-07-03 14:13:33 +0100381 for (mp_uint_t i = num_args; i > 0; i--) {
Damien429d7192013-10-04 19:53:11 +0100382 pn->nodes[i - 1] = pop_result(parser);
383 }
Damiend99b0522013-12-21 18:17:45 +0000384 push_result_node(parser, (mp_parse_node_t)pn);
Damien429d7192013-10-04 19:53:11 +0100385}
386
Damien George0bfc7632015-02-07 18:33:58 +0000387mp_parse_node_t mp_parse(mp_lexer_t *lex, mp_parse_input_kind_t input_kind) {
Damien George69a818d2014-01-12 13:55:24 +0000388
Damien George1b82e9a2014-05-10 17:36:41 +0100389 // initialise parser and allocate memory for its stacks
Damien George69a818d2014-01-12 13:55:24 +0000390
Damien George1b82e9a2014-05-10 17:36:41 +0100391 parser_t parser;
Damien George69a818d2014-01-12 13:55:24 +0000392
Damien George1b82e9a2014-05-10 17:36:41 +0100393 parser.had_memory_error = false;
Damien George58ba4c32014-04-10 14:27:31 +0000394
Damien George58ebde42014-05-21 20:32:59 +0100395 parser.rule_stack_alloc = MICROPY_ALLOC_PARSE_RULE_INIT;
Damien George1b82e9a2014-05-10 17:36:41 +0100396 parser.rule_stack_top = 0;
397 parser.rule_stack = m_new_maybe(rule_stack_t, parser.rule_stack_alloc);
Damien429d7192013-10-04 19:53:11 +0100398
Damien George58ebde42014-05-21 20:32:59 +0100399 parser.result_stack_alloc = MICROPY_ALLOC_PARSE_RESULT_INIT;
Damien George1b82e9a2014-05-10 17:36:41 +0100400 parser.result_stack_top = 0;
401 parser.result_stack = m_new_maybe(mp_parse_node_t, parser.result_stack_alloc);
Damien429d7192013-10-04 19:53:11 +0100402
Damien George1b82e9a2014-05-10 17:36:41 +0100403 parser.lexer = lex;
404
405 // check if we could allocate the stacks
406 if (parser.rule_stack == NULL || parser.result_stack == NULL) {
407 goto memory_error;
408 }
Damien George08335002014-01-18 23:24:36 +0000409
Damien George69a818d2014-01-12 13:55:24 +0000410 // work out the top-level rule to use, and push it on the stack
Damien George38161822014-07-03 14:13:33 +0100411 mp_uint_t top_level_rule;
Damien5ac1b2e2013-10-18 19:58:12 +0100412 switch (input_kind) {
Damiend99b0522013-12-21 18:17:45 +0000413 case MP_PARSE_SINGLE_INPUT: top_level_rule = RULE_single_input; break;
Damien Georged02c6d82014-01-15 22:14:03 +0000414 case MP_PARSE_EVAL_INPUT: top_level_rule = RULE_eval_input; break;
Damien5ac1b2e2013-10-18 19:58:12 +0100415 default: top_level_rule = RULE_file_input;
416 }
Damien Georgea4c52c52014-12-05 19:35:18 +0000417 push_rule(&parser, lex->tok_line, rules[top_level_rule], 0);
Damien429d7192013-10-04 19:53:11 +0100418
Damien George69a818d2014-01-12 13:55:24 +0000419 // parse!
420
Damien George38161822014-07-03 14:13:33 +0100421 mp_uint_t n, i; // state for the current rule
422 mp_uint_t rule_src_line; // source line for the first token matched by the current rule
Damien429d7192013-10-04 19:53:11 +0100423 bool backtrack = false;
Damien George08335002014-01-18 23:24:36 +0000424 const rule_t *rule = NULL;
Damien429d7192013-10-04 19:53:11 +0100425
426 for (;;) {
427 next_rule:
Damien George1b82e9a2014-05-10 17:36:41 +0100428 if (parser.rule_stack_top == 0 || parser.had_memory_error) {
Damien429d7192013-10-04 19:53:11 +0100429 break;
430 }
431
Damien George1b82e9a2014-05-10 17:36:41 +0100432 pop_rule(&parser, &rule, &i, &rule_src_line);
Damien429d7192013-10-04 19:53:11 +0100433 n = rule->act & RULE_ACT_ARG_MASK;
434
435 /*
436 // debugging
Damien George1b82e9a2014-05-10 17:36:41 +0100437 printf("depth=%d ", parser.rule_stack_top);
438 for (int j = 0; j < parser.rule_stack_top; ++j) {
Damien429d7192013-10-04 19:53:11 +0100439 printf(" ");
440 }
441 printf("%s n=%d i=%d bt=%d\n", rule->rule_name, n, i, backtrack);
442 */
443
444 switch (rule->act & RULE_ACT_KIND_MASK) {
445 case RULE_ACT_OR:
446 if (i > 0 && !backtrack) {
447 goto next_rule;
448 } else {
449 backtrack = false;
450 }
451 for (; i < n - 1; ++i) {
452 switch (rule->arg[i] & RULE_ARG_KIND_MASK) {
453 case RULE_ARG_TOK:
Damien Georgea4c52c52014-12-05 19:35:18 +0000454 if (lex->tok_kind == (rule->arg[i] & RULE_ARG_ARG_MASK)) {
455 push_result_token(&parser);
Damiend99b0522013-12-21 18:17:45 +0000456 mp_lexer_to_next(lex);
Damien429d7192013-10-04 19:53:11 +0100457 goto next_rule;
458 }
459 break;
460 case RULE_ARG_RULE:
Damien Georged2d64f02015-01-14 21:32:42 +0000461 rule_or_no_other_choice:
Damien George1b82e9a2014-05-10 17:36:41 +0100462 push_rule(&parser, rule_src_line, rule, i + 1); // save this or-rule
463 push_rule_from_arg(&parser, rule->arg[i]); // push child of or-rule
Damien429d7192013-10-04 19:53:11 +0100464 goto next_rule;
465 default:
466 assert(0);
Damien Georged2d64f02015-01-14 21:32:42 +0000467 goto rule_or_no_other_choice; // to help flow control analysis
Damien429d7192013-10-04 19:53:11 +0100468 }
469 }
470 if ((rule->arg[i] & RULE_ARG_KIND_MASK) == RULE_ARG_TOK) {
Damien Georgea4c52c52014-12-05 19:35:18 +0000471 if (lex->tok_kind == (rule->arg[i] & RULE_ARG_ARG_MASK)) {
472 push_result_token(&parser);
Damiend99b0522013-12-21 18:17:45 +0000473 mp_lexer_to_next(lex);
Damien429d7192013-10-04 19:53:11 +0100474 } else {
475 backtrack = true;
476 goto next_rule;
477 }
478 } else {
Damien George1b82e9a2014-05-10 17:36:41 +0100479 push_rule_from_arg(&parser, rule->arg[i]);
Damien429d7192013-10-04 19:53:11 +0100480 }
481 break;
482
Damien George2870d852014-12-20 18:06:08 +0000483 case RULE_ACT_AND: {
Damien429d7192013-10-04 19:53:11 +0100484
485 // failed, backtrack if we can, else syntax error
486 if (backtrack) {
487 assert(i > 0);
488 if ((rule->arg[i - 1] & RULE_ARG_KIND_MASK) == RULE_ARG_OPT_RULE) {
489 // an optional rule that failed, so continue with next arg
Damien George1b82e9a2014-05-10 17:36:41 +0100490 push_result_node(&parser, MP_PARSE_NODE_NULL);
Damien429d7192013-10-04 19:53:11 +0100491 backtrack = false;
492 } else {
493 // a mandatory rule that failed, so propagate backtrack
494 if (i > 1) {
495 // already eaten tokens so can't backtrack
496 goto syntax_error;
497 } else {
498 goto next_rule;
499 }
500 }
501 }
502
503 // progress through the rule
504 for (; i < n; ++i) {
505 switch (rule->arg[i] & RULE_ARG_KIND_MASK) {
Damien George2870d852014-12-20 18:06:08 +0000506 case RULE_ARG_TOK: {
Damien429d7192013-10-04 19:53:11 +0100507 // need to match a token
Damien George2870d852014-12-20 18:06:08 +0000508 mp_token_kind_t tok_kind = rule->arg[i] & RULE_ARG_ARG_MASK;
Damien Georgea4c52c52014-12-05 19:35:18 +0000509 if (lex->tok_kind == tok_kind) {
Damien429d7192013-10-04 19:53:11 +0100510 // matched token
Damiend99b0522013-12-21 18:17:45 +0000511 if (tok_kind == MP_TOKEN_NAME) {
Damien Georgea4c52c52014-12-05 19:35:18 +0000512 push_result_token(&parser);
Damien429d7192013-10-04 19:53:11 +0100513 }
Damiend99b0522013-12-21 18:17:45 +0000514 mp_lexer_to_next(lex);
Damien429d7192013-10-04 19:53:11 +0100515 } else {
516 // failed to match token
517 if (i > 0) {
518 // already eaten tokens so can't backtrack
519 goto syntax_error;
520 } else {
521 // this rule failed, so backtrack
522 backtrack = true;
523 goto next_rule;
524 }
525 }
526 break;
Damien Georged2d64f02015-01-14 21:32:42 +0000527 }
Damien429d7192013-10-04 19:53:11 +0100528 case RULE_ARG_RULE:
Damien429d7192013-10-04 19:53:11 +0100529 case RULE_ARG_OPT_RULE:
Damien Georged2d64f02015-01-14 21:32:42 +0000530 rule_and_no_other_choice:
Damien George1b82e9a2014-05-10 17:36:41 +0100531 push_rule(&parser, rule_src_line, rule, i + 1); // save this and-rule
532 push_rule_from_arg(&parser, rule->arg[i]); // push child of and-rule
Damien429d7192013-10-04 19:53:11 +0100533 goto next_rule;
534 default:
535 assert(0);
Damien Georged2d64f02015-01-14 21:32:42 +0000536 goto rule_and_no_other_choice; // to help flow control analysis
Damien429d7192013-10-04 19:53:11 +0100537 }
538 }
539
540 assert(i == n);
541
542 // matched the rule, so now build the corresponding parse_node
543
544 // count number of arguments for the parse_node
545 i = 0;
Damien George2870d852014-12-20 18:06:08 +0000546 bool emit_rule = false;
Damien George38161822014-07-03 14:13:33 +0100547 for (mp_uint_t x = 0; x < n; ++x) {
Damien429d7192013-10-04 19:53:11 +0100548 if ((rule->arg[x] & RULE_ARG_KIND_MASK) == RULE_ARG_TOK) {
Damien George2870d852014-12-20 18:06:08 +0000549 mp_token_kind_t tok_kind = rule->arg[x] & RULE_ARG_ARG_MASK;
Damiend99b0522013-12-21 18:17:45 +0000550 if (tok_kind >= MP_TOKEN_NAME) {
Damien429d7192013-10-04 19:53:11 +0100551 emit_rule = true;
552 }
Damiend99b0522013-12-21 18:17:45 +0000553 if (tok_kind == MP_TOKEN_NAME) {
Damien429d7192013-10-04 19:53:11 +0100554 // only tokens which were names are pushed to stack
555 i += 1;
556 }
557 } else {
558 // rules are always pushed
559 i += 1;
560 }
561 }
562
Damien George5042bce2014-05-25 22:06:06 +0100563#if !MICROPY_EMIT_CPYTHON && !MICROPY_ENABLE_DOC_STRING
564 // this code discards lonely statements, such as doc strings
Damien George1b82e9a2014-05-10 17:36:41 +0100565 if (input_kind != MP_PARSE_SINGLE_INPUT && rule->rule_id == RULE_expr_stmt && peek_result(&parser, 0) == MP_PARSE_NODE_NULL) {
566 mp_parse_node_t p = peek_result(&parser, 1);
Damien George5042bce2014-05-25 22:06:06 +0100567 if ((MP_PARSE_NODE_IS_LEAF(p) && !MP_PARSE_NODE_IS_ID(p)) || MP_PARSE_NODE_IS_STRUCT_KIND(p, RULE_string)) {
Damien George52b5d762014-09-23 15:31:56 +0000568 pop_result(&parser); // MP_PARSE_NODE_NULL
569 mp_parse_node_free(pop_result(&parser)); // RULE_string
Damien George1b82e9a2014-05-10 17:36:41 +0100570 push_result_rule(&parser, rule_src_line, rules[RULE_pass_stmt], 0);
Damien George93afa232014-05-06 21:44:11 +0100571 break;
572 }
573 }
574#endif
575
Damien429d7192013-10-04 19:53:11 +0100576 // always emit these rules, even if they have only 1 argument
577 if (rule->rule_id == RULE_expr_stmt || rule->rule_id == RULE_yield_stmt) {
578 emit_rule = true;
579 }
580
Damien Georgeb47ea4e2014-12-20 18:37:50 +0000581 // if a rule has the RULE_ACT_ALLOW_IDENT bit set then this
582 // rule should not be emitted if it has only 1 argument
583 // NOTE: can't set this flag for atom_paren because we need it
584 // to distinguish, for example, [a,b] from [(a,b)]
585 // TODO possibly set for: varargslist_name, varargslist_equal
586 if (rule->act & RULE_ACT_ALLOW_IDENT) {
Damien429d7192013-10-04 19:53:11 +0100587 emit_rule = false;
588 }
589
590 // always emit these rules, and add an extra blank node at the end (to be used by the compiler to store data)
Damien Georgeb47ea4e2014-12-20 18:37:50 +0000591 if (ADD_BLANK_NODE(rule)) {
Damien429d7192013-10-04 19:53:11 +0100592 emit_rule = true;
Damien George1b82e9a2014-05-10 17:36:41 +0100593 push_result_node(&parser, MP_PARSE_NODE_NULL);
Damien429d7192013-10-04 19:53:11 +0100594 i += 1;
595 }
596
Damien George38161822014-07-03 14:13:33 +0100597 mp_uint_t num_not_nil = 0;
598 for (mp_uint_t x = 0; x < i; ++x) {
Damien George1b82e9a2014-05-10 17:36:41 +0100599 if (peek_result(&parser, x) != MP_PARSE_NODE_NULL) {
Damien429d7192013-10-04 19:53:11 +0100600 num_not_nil += 1;
601 }
602 }
Damien429d7192013-10-04 19:53:11 +0100603 if (emit_rule) {
Damien George1b82e9a2014-05-10 17:36:41 +0100604 push_result_rule(&parser, rule_src_line, rule, i);
Damien429d7192013-10-04 19:53:11 +0100605 } else if (num_not_nil == 0) {
Damien George1b82e9a2014-05-10 17:36:41 +0100606 push_result_rule(&parser, rule_src_line, rule, i); // needed for, eg, atom_paren, testlist_comp_3b
Damien429d7192013-10-04 19:53:11 +0100607 } else if (num_not_nil == 1) {
608 // single result, leave it on stack
Damiend99b0522013-12-21 18:17:45 +0000609 mp_parse_node_t pn = MP_PARSE_NODE_NULL;
Damien George38161822014-07-03 14:13:33 +0100610 for (mp_uint_t x = 0; x < i; ++x) {
Damien George1b82e9a2014-05-10 17:36:41 +0100611 mp_parse_node_t pn2 = pop_result(&parser);
Damiend99b0522013-12-21 18:17:45 +0000612 if (pn2 != MP_PARSE_NODE_NULL) {
Damien429d7192013-10-04 19:53:11 +0100613 pn = pn2;
614 }
615 }
Damien George1b82e9a2014-05-10 17:36:41 +0100616 push_result_node(&parser, pn);
Damien429d7192013-10-04 19:53:11 +0100617 } else {
Damien George1b82e9a2014-05-10 17:36:41 +0100618 push_result_rule(&parser, rule_src_line, rule, i);
Damien429d7192013-10-04 19:53:11 +0100619 }
620 break;
Damien George2870d852014-12-20 18:06:08 +0000621 }
Damien429d7192013-10-04 19:53:11 +0100622
Damien George2870d852014-12-20 18:06:08 +0000623 case RULE_ACT_LIST: {
Damien429d7192013-10-04 19:53:11 +0100624 // n=2 is: item item*
625 // n=1 is: item (sep item)*
626 // n=3 is: item (sep item)* [sep]
Damien George2870d852014-12-20 18:06:08 +0000627 bool had_trailing_sep;
Damien429d7192013-10-04 19:53:11 +0100628 if (backtrack) {
629 list_backtrack:
630 had_trailing_sep = false;
631 if (n == 2) {
632 if (i == 1) {
633 // fail on item, first time round; propagate backtrack
634 goto next_rule;
635 } else {
636 // fail on item, in later rounds; finish with this rule
637 backtrack = false;
638 }
639 } else {
640 if (i == 1) {
641 // fail on item, first time round; propagate backtrack
642 goto next_rule;
643 } else if ((i & 1) == 1) {
644 // fail on item, in later rounds; have eaten tokens so can't backtrack
645 if (n == 3) {
646 // list allows trailing separator; finish parsing list
647 had_trailing_sep = true;
648 backtrack = false;
649 } else {
650 // list doesn't allow a trailing separator; fail
651 goto syntax_error;
652 }
653 } else {
654 // fail on separator; finish parsing list
655 backtrack = false;
656 }
657 }
658 } else {
659 for (;;) {
Damien George38161822014-07-03 14:13:33 +0100660 mp_uint_t arg = rule->arg[i & 1 & n];
Damien429d7192013-10-04 19:53:11 +0100661 switch (arg & RULE_ARG_KIND_MASK) {
662 case RULE_ARG_TOK:
Damien Georgea4c52c52014-12-05 19:35:18 +0000663 if (lex->tok_kind == (arg & RULE_ARG_ARG_MASK)) {
Damien429d7192013-10-04 19:53:11 +0100664 if (i & 1 & n) {
665 // separators which are tokens are not pushed to result stack
666 } else {
Damien Georgea4c52c52014-12-05 19:35:18 +0000667 push_result_token(&parser);
Damien429d7192013-10-04 19:53:11 +0100668 }
Damiend99b0522013-12-21 18:17:45 +0000669 mp_lexer_to_next(lex);
Damien429d7192013-10-04 19:53:11 +0100670 // got element of list, so continue parsing list
671 i += 1;
672 } else {
673 // couldn't get element of list
674 i += 1;
675 backtrack = true;
676 goto list_backtrack;
677 }
678 break;
679 case RULE_ARG_RULE:
Damien Georged2d64f02015-01-14 21:32:42 +0000680 rule_list_no_other_choice:
Damien George1b82e9a2014-05-10 17:36:41 +0100681 push_rule(&parser, rule_src_line, rule, i + 1); // save this list-rule
682 push_rule_from_arg(&parser, arg); // push child of list-rule
Damien429d7192013-10-04 19:53:11 +0100683 goto next_rule;
684 default:
685 assert(0);
Damien Georged2d64f02015-01-14 21:32:42 +0000686 goto rule_list_no_other_choice; // to help flow control analysis
Damien429d7192013-10-04 19:53:11 +0100687 }
688 }
689 }
690 assert(i >= 1);
691
692 // compute number of elements in list, result in i
693 i -= 1;
694 if ((n & 1) && (rule->arg[1] & RULE_ARG_KIND_MASK) == RULE_ARG_TOK) {
695 // don't count separators when they are tokens
696 i = (i + 1) / 2;
697 }
698
699 if (i == 1) {
700 // list matched single item
701 if (had_trailing_sep) {
702 // if there was a trailing separator, make a list of a single item
Damien George1b82e9a2014-05-10 17:36:41 +0100703 push_result_rule(&parser, rule_src_line, rule, i);
Damien429d7192013-10-04 19:53:11 +0100704 } else {
705 // just leave single item on stack (ie don't wrap in a list)
706 }
707 } else {
Damien George1b82e9a2014-05-10 17:36:41 +0100708 push_result_rule(&parser, rule_src_line, rule, i);
Damien429d7192013-10-04 19:53:11 +0100709 }
710 break;
Damien George2870d852014-12-20 18:06:08 +0000711 }
Damien429d7192013-10-04 19:53:11 +0100712
713 default:
714 assert(0);
715 }
716 }
Damien91d387d2013-10-09 15:09:52 +0100717
Damien Georgef8048332015-02-08 13:40:20 +0000718 mp_obj_t exc;
719 mp_parse_node_t result;
Damien George58ba4c32014-04-10 14:27:31 +0000720
721 // check if we had a memory error
Damien George1b82e9a2014-05-10 17:36:41 +0100722 if (parser.had_memory_error) {
723memory_error:
Damien George0bfc7632015-02-07 18:33:58 +0000724 exc = mp_obj_new_exception_msg(&mp_type_MemoryError,
725 "parser could not allocate enough memory");
Damien Georgef8048332015-02-08 13:40:20 +0000726 result = MP_PARSE_NODE_NULL;
Damien George58ba4c32014-04-10 14:27:31 +0000727 goto finished;
Damien George58ba4c32014-04-10 14:27:31 +0000728 }
729
Damien91d387d2013-10-09 15:09:52 +0100730 // check we are at the end of the token stream
Damien Georgea4c52c52014-12-05 19:35:18 +0000731 if (lex->tok_kind != MP_TOKEN_END) {
Damien91d387d2013-10-09 15:09:52 +0100732 goto syntax_error;
Damien429d7192013-10-04 19:53:11 +0100733 }
Damien91d387d2013-10-09 15:09:52 +0100734
Damien429d7192013-10-04 19:53:11 +0100735 //result_stack_show(parser);
Damien George1b82e9a2014-05-10 17:36:41 +0100736 //printf("rule stack alloc: %d\n", parser.rule_stack_alloc);
737 //printf("result stack alloc: %d\n", parser.result_stack_alloc);
Damien429d7192013-10-04 19:53:11 +0100738 //printf("number of parse nodes allocated: %d\n", num_parse_nodes_allocated);
Damien George69a818d2014-01-12 13:55:24 +0000739
740 // get the root parse node that we created
Damien George1b82e9a2014-05-10 17:36:41 +0100741 assert(parser.result_stack_top == 1);
Damien Georgef8048332015-02-08 13:40:20 +0000742 exc = MP_OBJ_NULL;
Damien George1b82e9a2014-05-10 17:36:41 +0100743 result = parser.result_stack[0];
Damien George69a818d2014-01-12 13:55:24 +0000744
745finished:
746 // free the memory that we don't need anymore
Damien George1b82e9a2014-05-10 17:36:41 +0100747 m_del(rule_stack_t, parser.rule_stack, parser.rule_stack_alloc);
748 m_del(mp_parse_node_t, parser.result_stack, parser.result_stack_alloc);
Damien George0bfc7632015-02-07 18:33:58 +0000749 // we also free the lexer on behalf of the caller (see below)
Damien George69a818d2014-01-12 13:55:24 +0000750
Damien George0bfc7632015-02-07 18:33:58 +0000751 if (exc != MP_OBJ_NULL) {
752 // had an error so raise the exception
753 // add traceback to give info about file name and location
754 // we don't have a 'block' name, so just pass the NULL qstr to indicate this
755 mp_obj_exception_add_traceback(exc, lex->source_name, lex->tok_line, MP_QSTR_NULL);
756 mp_lexer_free(lex);
757 nlr_raise(exc);
758 } else {
759 mp_lexer_free(lex);
760 return result;
761 }
Damien429d7192013-10-04 19:53:11 +0100762
763syntax_error:
Damien Georgea4c52c52014-12-05 19:35:18 +0000764 if (lex->tok_kind == MP_TOKEN_INDENT) {
Damien George0bfc7632015-02-07 18:33:58 +0000765 exc = mp_obj_new_exception_msg(&mp_type_IndentationError,
766 "unexpected indent");
Damien Georgea4c52c52014-12-05 19:35:18 +0000767 } else if (lex->tok_kind == MP_TOKEN_DEDENT_MISMATCH) {
Damien George0bfc7632015-02-07 18:33:58 +0000768 exc = mp_obj_new_exception_msg(&mp_type_IndentationError,
769 "unindent does not match any outer indentation level");
Damien91d387d2013-10-09 15:09:52 +0100770 } else {
Damien George0bfc7632015-02-07 18:33:58 +0000771 exc = mp_obj_new_exception_msg(&mp_type_SyntaxError,
772 "invalid syntax");
Damien429d7192013-10-04 19:53:11 +0100773#ifdef USE_RULE_NAME
Damien George9528cd62014-01-15 21:23:31 +0000774 // debugging: print the rule name that failed and the token
Damien Georgec5966122014-02-15 16:10:44 +0000775 printf("rule: %s\n", rule->rule_name);
776#if MICROPY_DEBUG_PRINTERS
nhtshot5d323de2015-02-23 15:05:32 -0600777 mp_lexer_show_token(lex);
Damien George9528cd62014-01-15 21:23:31 +0000778#endif
Damien Georgec5966122014-02-15 16:10:44 +0000779#endif
Damien91d387d2013-10-09 15:09:52 +0100780 }
Damien Georgef8048332015-02-08 13:40:20 +0000781 result = MP_PARSE_NODE_NULL;
Damien George69a818d2014-01-12 13:55:24 +0000782 goto finished;
Damien429d7192013-10-04 19:53:11 +0100783}