/* Members of the parser state (partial view; the struct header is not part
 * of this excerpt). Each MEM_VECTOR_MAKE member is accessed below through a
 * matching <name>_count field and parser_t_<name>_add() helper. */
11 MEM_VECTOR_MAKE(ast_value*, globals);
12 MEM_VECTOR_MAKE(ast_function*, functions);
13 MEM_VECTOR_MAKE(ast_value*, imm_float); /* float immediates, reused by parser_const_float */
15 ast_function *function; /* set to the function whose body is being parsed (see parser_variable) */
16 MEM_VECTOR_MAKE(ast_value*, locals);
/* Instantiate the vector helper functions for each vector member of parser_t
 * (the parser_t_<member>_add() functions called further down). */
20 MEM_VEC_FUNCTIONS(parser_t, ast_value*, globals)
21 MEM_VEC_FUNCTIONS(parser_t, ast_value*, imm_float)
22 MEM_VEC_FUNCTIONS(parser_t, ast_value*, locals)
23 MEM_VEC_FUNCTIONS(parser_t, ast_function*, functions)
/* Report a parse error. Takes a format string plus variadic arguments and
 * prefixes the output with the file name and line number of the lexer's
 * current token. NOTE(review): the formatting of `fmt` itself is not visible
 * in this excerpt. */
25 void parseerror(parser_t *parser, const char *fmt, ...)
30 printf("error %s:%lu: ", parser->lex->tok->ctx.file, (unsigned long)parser->lex->tok->ctx.line);
/* Advance to the next token: stores the result of lex_do() in parser->tok.
 * TOKEN_EOF and any value >= TOKEN_ERROR are singled out by the check below;
 * callers treat a false return as "no further token" (the return statements
 * themselves are not visible in this excerpt). */
41 bool parser_next(parser_t *parser)
43 /* lex_do kills the previous token */
44 parser->tok = lex_do(parser->lex);
45 if (parser->tok == TOKEN_EOF || parser->tok >= TOKEN_ERROR)
50 /* lift a token out of the parser so it's not destroyed by parser_next */
/* Grabs the lexer's current token pointer and resets parser->lex->tok to
 * NULL. NOTE(review): presumably the grabbed pointer is returned and the
 * caller becomes its owner -- confirm against the full function. */
51 token *parser_lift(parser_t *parser)
53 token *tok = parser->lex->tok;
54 parser->lex->tok = NULL;
/* Shorthand accessors for the lexer's current token: its string value, the
 * token itself, and its source context. The macro argument is parenthesized
 * so that any pointer-valued expression can be passed safely. */
58 #define parser_tokval(p) ((p)->lex->tok->value)
59 #define parser_token(p) ((p)->lex->tok)
60 #define parser_ctx(p) ((p)->lex->tok->ctx)
/* Get the ast_value representing the float immediate `d`.
 * An existing entry of parser->imm_float whose constant compares equal to
 * `d` is reused; otherwise a new TYPE_FLOAT value named "#IMMEDIATE" is
 * created, given the constant, and added to parser->imm_float. The new value
 * is deleted again when adding it to the vector fails. */
62 ast_value* parser_const_float(parser_t *parser, double d)
66 for (i = 0; i < parser->imm_float_count; ++i) {
67 if (parser->imm_float[i]->constval.vfloat == d)
68 return parser->imm_float[i];
70 out = ast_value_new(parser_ctx(parser), "#IMMEDIATE", TYPE_FLOAT);
72 out->constval.vfloat = d;
73 if (!parser_t_imm_float_add(parser, out)) {
74 ast_value_delete(out);
/* Linear search through parser->globals; returns the first entry whose name
 * equals `name`. NOTE(review): the not-found return is not visible here. */
80 ast_value* parser_find_global(parser_t *parser, const char *name)
83 for (i = 0; i < parser->globals_count; ++i) {
84 if (!strcmp(parser->globals[i]->name, name))
85 return parser->globals[i];
/* Search parser->locals for `name`, walking downwards from locals_count and
 * stopping once the index reaches `upto`, so entries below `upto` are not
 * considered. NOTE(review): the index decrement inside the loop body is not
 * visible in this excerpt. */
90 ast_value* parser_find_local(parser_t *parser, const char *name, size_t upto)
93 for (i = parser->locals_count; i > upto;) {
95 if (!strcmp(parser->locals[i]->name, name))
96 return parser->locals[i];
/* Resolve a variable name: all locals are searched first (upto = 0), and
 * globals are consulted only when no local matched. */
101 ast_value* parser_find_var(parser_t *parser, const char *name)
104 v = parser_find_local(parser, name, 0);
105 if (!v) v = parser_find_global(parser, name);
/* paramlist_t: a vector `p` of ast_value pointers, used by parser_parse_type
 * to collect parameters (via paramlist_t_p_add). */
110 MEM_VECTOR_MAKE(ast_value*, p);
112 MEM_VEC_FUNCTIONS(paramlist_t, ast_value*, p)
/* Parse a type that starts out as `basetype`.
 * When the current token is '(' a parameter list follows: each parameter's
 * base type is read from the current token and parsed recursively, and the
 * results are collected in the local `params` vector. On success a new
 * ast_value named "<unnamed>" is created and the collected parameters are
 * moved into it. Every visible error path clears `params` first.
 * NOTE(review): how `vtype` and `*isfunc` are updated for function types is
 * not visible in this excerpt. */
114 static ast_value *parser_parse_type(parser_t *parser, int basetype, bool *isfunc)
118 lex_ctx ctx = parser_ctx(parser);
119 int vtype = basetype;
122 MEM_VECTOR_INIT(&params, p);
126 if (parser->tok == '(') {
132 if (!parser_next(parser)) {
133 MEM_VECTOR_CLEAR(&params, p);
137 if (parser->tok == ')')
140 temptype = parser_token(parser)->constval.t;
141 if (!parser_next(parser)) {
142 MEM_VECTOR_CLEAR(&params, p);
145 param = parser_parse_type(parser, temptype, &dummy);
149 MEM_VECTOR_CLEAR(&params, p);
153 if (!paramlist_t_p_add(&params, param)) {
154 MEM_VECTOR_CLEAR(&params, p);
155 parseerror(parser, "Out of memory while parsing typename");
159 if (parser->tok == ',')
161 if (parser->tok == ')')
163 MEM_VECTOR_CLEAR(&params, p);
164 parseerror(parser, "Unexpected token");
167 if (!parser_next(parser)) {
168 MEM_VECTOR_CLEAR(&params, p);
173 var = ast_value_new(ctx, "<unnamed>", vtype);
175 MEM_VECTOR_CLEAR(&params, p);
178 MEM_VECTOR_MOVE(&params, p, var, params); /* hand the collected parameters over to var */
/* Element and state types used by the expression parser (partial view).
 * For operators, etype is 1 + the operator's index in operators[] (see syop
 * and parser_sy_pop). `out` collects operand elements, `ops` holds the
 * operators that have not been applied yet. */
184 size_t etype; /* 0 = expression, others are operators */
189 MEM_VECTOR_MAKE(sy_elem, out);
190 MEM_VECTOR_MAKE(sy_elem, ops);
192 MEM_VEC_FUNCTIONS(shynt, sy_elem, out)
193 MEM_VEC_FUNCTIONS(shynt, sy_elem, ops)
/* Build a sy_elem from an expression (body not visible in this excerpt). */
195 static sy_elem syexp(ast_expression *v) {
/* Convenience wrapper: build a sy_elem from an ast_value by casting it to
 * ast_expression* and delegating to syexp(). */
201 static sy_elem syval(ast_value *v) { return syexp((ast_expression*)v); }
/* Build a sy_elem for an operator. The operator is encoded as its index in
 * operators[] plus one, keeping etype 0 reserved for plain expressions. */
203 static sy_elem syop(const oper_info *op) {
205 e.etype = 1 + (op - operators);
/* Apply the operator on top of sy->ops: its operands are taken off the end
 * of sy->out and gathered into vals[]. An internal error is reported when
 * there is no operator or when fewer operands are available than the
 * operator requires.
 * NOTE(review): vals[] has room for 3 entries, so this assumes
 * op->operands <= 3 -- confirm against the operators table. The code that
 * builds the resulting expression is not visible in this excerpt. */
210 static bool parser_sy_pop(parser_t *parser, shynt *sy)
213 ast_expression *vals[3];
216 if (!sy->ops_count) {
217 parseerror(parser, "internal error: missing operator");
221 op = &operators[sy->ops[sy->ops_count-1].etype - 1]; /* etype is index + 1, see syop */
223 if (sy->out_count < op->operands) {
224 parseerror(parser, "internal error: not enough operands");
230 sy->out_count -= op->operands; /* drop the operands from the output vector... */
231 for (i = 0; i < op->operands; ++i)
232 vals[i] = sy->out[sy->out_count+i].out; /* ...and read them from the slots just released */
237 parseerror(parser, "internal error: unhandled operand");
/* Parse an expression made of operands and infix operators.
 * Operands (identifiers resolved through parser_find_var, float constants,
 * and integer constants converted to double) are appended to sy.out.
 * Operators are looked up by their token text among the entries of
 * operators[] that are neither OP_PREFIX nor OP_SUFFIX. Before a new
 * operator is pushed onto sy.ops, pending operators are applied via
 * parser_sy_pop() according to the precedence/associativity comparison
 * below. Once the input ends, all remaining operators are applied and
 * sy.out[0].out is taken as the result.
 * The lexer flag `noops` is switched off while an operator is expected and
 * back on while an operand is expected; it is set to true on the way out. */
244 static ast_expression* parser_expression(parser_t *parser)
246 ast_expression *expr = NULL;
250 MEM_VECTOR_INIT(&sy, out);
251 MEM_VECTOR_INIT(&sy, ops);
257 if (parser->tok == TOKEN_IDENT)
260 ast_value *var = parser_find_var(parser, parser_tokval(parser));
262 parseerror(parser, "unexpected ident: %s", parser_tokval(parser));
265 if (!shynt_out_add(&sy, syval(var))) {
266 parseerror(parser, "out of memory");
269 } else if (parser->tok == TOKEN_FLOATCONST) {
270 ast_value *val = parser_const_float(parser, (parser_token(parser)->constval.f));
273 if (!shynt_out_add(&sy, syval(val))) {
274 parseerror(parser, "out of memory");
277 } else if (parser->tok == TOKEN_INTCONST) {
278 ast_value *val = parser_const_float(parser, (double)(parser_token(parser)->constval.i)); /* integer constants become float immediates */
281 if (!shynt_out_add(&sy, syval(val))) {
282 parseerror(parser, "out of memory");
286 /* TODO: prefix operators */
287 parseerror(parser, "expected statement");
291 parser->lex->flags.noops = false; /* an operator is expected next */
292 if (!parser_next(parser)) {
296 if (parser->tok != TOKEN_OPERATOR) {
297 parseerror(parser, "expected operator or end of statement");
300 /* classify the operator */
301 /* TODO: suffix operators */
303 const oper_info *olast = NULL;
305 for (o = 0; o < operator_count; ++o) {
306 if (!(operators[o].flags & OP_PREFIX) &&
307 !(operators[o].flags & OP_SUFFIX) && /* remove this */
308 !strcmp(parser_tokval(parser), operators[o].op))
313 if (o == operator_count) {
314 /* no operator found... must be the end of the statement */
317 /* found an operator */
321 olast = &operators[sy.ops[sy.ops_count-1].etype-1];
324 (op->prec < olast->prec) ||
325 (op->assoc == ASSOC_LEFT && op->prec <= olast->prec) ) )
327 if (!parser_sy_pop(parser, &sy))
329 olast = sy.ops_count ? (&operators[sy.ops[sy.ops_count-1].etype-1]) : NULL;
332 if (!shynt_ops_add(&sy, syop(op)))
336 parser->lex->flags.noops = true; /* an operand is expected next */
337 if (!parser_next(parser)) {
343 while (sy.ops_count) {
344 if (!parser_sy_pop(parser, &sy))
348 parser->lex->flags.noops = true;
350 parseerror(parser, "empty expression");
353 expr = sy.out[0].out;
354 MEM_VECTOR_CLEAR(&sy, out);
355 MEM_VECTOR_CLEAR(&sy, ops);
359 parser->lex->flags.noops = true;
360 MEM_VECTOR_CLEAR(&sy, out);
361 MEM_VECTOR_CLEAR(&sy, ops);
/* Forward declaration: parser_body_do() needs parser_variable() for local
 * declarations. */
365 static bool parser_variable(parser_t *parser, bool global);
/* Parse one item of a function body into `block`:
 *  - a type name starts a local variable declaration,
 *  - '{' (a nested block) is reported as not implemented yet,
 *  - anything else is parsed as an expression and appended to the block. */
366 static bool parser_body_do(parser_t *parser, ast_block *block)
368 if (parser->tok == TOKEN_TYPENAME)
371 if (!parser_variable(parser, false))
375 else if (parser->tok == '{')
378 parseerror(parser, "TODO: inner blocks");
383 ast_expression *exp = parser_expression(parser);
386 if (!ast_block_exprs_add(block, exp))
/* Parse a '{ ... }' block. The current token is expected to be the opening
 * '{'. parser->blocklocal is set to the current number of locals for the
 * duration of the block (parser_variable uses it as the lower bound of its
 * duplicate-local check) and is restored afterwards. Body items are parsed
 * with parser_body_do() until '}' is reached; the block is deleted when an
 * item fails to parse or the closing '}' is missing. */
392 static ast_block* parser_parse_block(parser_t *parser)
394 size_t oldblocklocal;
395 ast_block *block = NULL;
397 oldblocklocal = parser->blocklocal;
398 parser->blocklocal = parser->locals_count;
400 if (!parser_next(parser)) { /* skip the '{' */
401 parseerror(parser, "expected function body");
405 block = ast_block_new(parser_ctx(parser));
407 while (parser->tok != TOKEN_EOF && parser->tok < TOKEN_ERROR)
409 if (parser->tok == '}')
412 if (!parser_body_do(parser, block)) {
413 ast_block_delete(block);
419 if (parser->tok != '}') {
420 ast_block_delete(block);
423 (void)parser_next(parser); /* move past the '}'; the result is deliberately ignored */
427 parser->blocklocal = oldblocklocal;
/* Parse a variable or function declaration; the current token is the base
 * type name. `global` selects whether declared names go into parser->globals
 * or parser->locals.
 * For every declarator: the type is parsed with parser_parse_type(), the
 * name must be an identifier that does not already exist (among globals, or
 * among the locals of the current block as delimited by parser->blocklocal),
 * and the value is added to the matching vector. When a function was
 * declared, a TYPE_FUNCTION value and an ast_function are created and the
 * function is registered in parser->functions.
 * After the name: ';' ends the declaration, ',' continues with another
 * declarator, and '=' introduces either a builtin number ('#' followed by a
 * positive integer constant, stored negated in func->builtin) or a function
 * body ('{'), which is parsed with parser->function temporarily pointing at
 * the new function. Any other initializer is reported as not implemented.
 * NOTE(review): many lines, including all return statements, are missing
 * from this excerpt. */
431 static bool parser_variable(parser_t *parser, bool global)
434 ast_function *func = NULL;
438 int basetype = parser_token(parser)->constval.t;
442 if (!parser_next(parser)) { /* skip basetype or comma */
443 parseerror(parser, "expected variable declaration");
449 ctx = parser_ctx(parser);
450 var = parser_parse_type(parser, basetype, &isfunc);
455 if (parser->tok != TOKEN_IDENT) {
456 parseerror(parser, "expected variable name\n");
460 if (global && parser_find_global(parser, parser_tokval(parser))) {
461 ast_value_delete(var);
462 parseerror(parser, "global already exists: %s\n", parser_tokval(parser));
466 if (!global && parser_find_local(parser, parser_tokval(parser), parser->blocklocal)) {
467 ast_value_delete(var);
468 parseerror(parser, "local variable already exists: %s\n", parser_tokval(parser));
472 if (!ast_value_set_name(var, parser_tokval(parser))) {
473 parseerror(parser, "failed to set variable name\n");
474 ast_value_delete(var);
479 /* a function was defined */
482 /* turn var into a value of TYPE_FUNCTION, with the old var
485 fval = ast_value_new(ctx, var->name, TYPE_FUNCTION);
486 func = ast_function_new(ctx, var->name, fval);
487 if (!fval || !func) {
488 ast_value_delete(var);
489 if (fval) ast_value_delete(fval);
490 if (func) ast_function_delete(func);
494 fval->expression.next = (ast_expression*)var;
495 MEM_VECTOR_MOVE(var, params, fval, params);
497 if (!parser_t_functions_add(parser, func)) {
498 ast_value_delete(var);
499 if (fval) ast_value_delete(fval);
500 if (func) ast_function_delete(func);
507 if ( ( global && !parser_t_globals_add(parser, var)) ||
508 (!global && !parser_t_locals_add(parser, var)) )
510 ast_value_delete(var);
514 if (!parser_next(parser)) {
515 ast_value_delete(var);
519 if (parser->tok == ';') {
520 if (!parser_next(parser))
521 return parser->tok == TOKEN_EOF;
525 if (parser->tok == ',') {
530 if (parser->tok != '=') {
531 parseerror(parser, "expected '=' or ';'");
535 if (!parser_next(parser))
538 if (parser->tok == '#') {
540 parseerror(parser, "cannot declare builtins within functions");
543 if (!isfunc || !func) {
544 parseerror(parser, "unexpected builtin number, '%s' is not a function", var->name);
547 if (!parser_next(parser)) {
548 parseerror(parser, "expected builtin number");
551 if (parser->tok != TOKEN_INTCONST) {
552 parseerror(parser, "builtin number must be an integer constant");
555 if (parser_token(parser)->constval.i <= 0) {
556 parseerror(parser, "builtin number must be positive integer greater than zero");
560 func->builtin = -parser_token(parser)->constval.i;
561 } else if (parser->tok == '{') {
564 ast_function *old = parser->function;
567 parseerror(parser, "cannot declare functions within functions");
571 parser->function = func;
572 block = parser_parse_block(parser);
573 parser->function = old;
578 if (!ast_function_blocks_add(func, block)) {
579 ast_block_delete(block);
584 parseerror(parser, "TODO, const assignment");
587 if (!parser_next(parser))
590 if (parser->tok == ',') {
595 if (parser->tok != ';') {
596 parseerror(parser, "expected semicolon");
600 (void)parser_next(parser);
/* Parse one top-level construct. A type name starts a global declaration
 * (handled by parser_variable with global = true); keywords and '.' have
 * dedicated branches whose bodies are not visible in this excerpt; any other
 * token is reported as unexpected. */
606 static bool parser_do(parser_t *parser)
608 if (parser->tok == TOKEN_TYPENAME)
610 return parser_variable(parser, true);
612 else if (parser->tok == TOKEN_KEYWORD)
614 /* handle 'var' and 'const' */
617 else if (parser->tok == '.')
619 /* entity-member declaration */
624 parseerror(parser, "unexpected token: %s", parser->lex->tok->value);
/* Compile the source file `filename`.
 * Steps visible in this excerpt:
 *  1. allocate and zero a parser_t, then open a lexer on the file;
 *  2. run parser_do() until EOF or an error token, reporting a parse error
 *     (and closing the lexer) when a top-level construct fails;
 *  3. create an IR builder and generate code for the float immediates, the
 *     globals and the functions, finalizing each function's IR;
 *  4. dump the IR and delete the global values.
 * NOTE(review): return statements and the remaining cleanup are not part of
 * this excerpt. */
630 bool parser_compile(const char *filename)
636 parser = (parser_t*)mem_a(sizeof(parser_t));
/* Zero the whole structure. sizeof(parser) would only cover the size of the
 * pointer and leave most members (e.g. the imm_float and functions vectors,
 * which get no explicit MEM_VECTOR_INIT below) uninitialized. */
640 memset(parser, 0, sizeof(*parser));
642 MEM_VECTOR_INIT(parser, globals);
643 MEM_VECTOR_INIT(parser, locals);
644 parser->lex = lex_open(filename);
647 printf("failed to open file \"%s\"\n", filename);
651 /* initial lexer/parser state */
652 parser->lex->flags.noops = true;
654 if (parser_next(parser))
656 while (parser->tok != TOKEN_EOF && parser->tok < TOKEN_ERROR)
658 if (!parser_do(parser)) {
659 if (parser->tok == TOKEN_EOF)
660 parseerror(parser, "unexpected eof");
662 parseerror(parser, "parse error\n");
663 lex_close(parser->lex);
670 lex_close(parser->lex);
672 ir = ir_builder_new("gmqcc_out");
674 printf("failed to allocate builder\n");
678 for (i = 0; i < parser->imm_float_count; ++i) {
679 if (!ast_global_codegen(parser->imm_float[i], ir)) {
680 printf("failed to generate global %s\n", parser->imm_float[i]->name);
683 for (i = 0; i < parser->globals_count; ++i) {
684 if (!ast_global_codegen(parser->globals[i], ir)) {
685 printf("failed to generate global %s\n", parser->globals[i]->name);
688 for (i = 0; i < parser->functions_count; ++i) {
689 if (!ast_function_codegen(parser->functions[i], ir)) {
690 printf("failed to generate function %s\n", parser->functions[i]->name);
692 if (!ir_function_finalize(parser->functions[i]->ir_func)) {
693 printf("failed to finalize function %s\n", parser->functions[i]->name);
697 ir_builder_dump(ir, printf);
700 for (i = 0; i < parser->globals_count; ++i) {
701 ast_value_delete(parser->globals[i]);
703 MEM_VECTOR_CLEAR(parser, globals);