11 MEM_VECTOR_MAKE(ast_value*, globals);
12 MEM_VECTOR_MAKE(ast_function*, functions);
13 MEM_VECTOR_MAKE(ast_value*, imm_float);
15 ast_function *function;
16 MEM_VECTOR_MAKE(ast_value*, locals);
/* Instantiate the vector helper functions for the four parser_t vectors
 * (globals, imm_float, locals, functions). Presumably this is what provides
 * the parser_t_<name>_add() functions called further down in this file,
 * e.g. parser_t_imm_float_add() and parser_t_globals_add(). */
20 MEM_VEC_FUNCTIONS(parser_t, ast_value*, globals)
21 MEM_VEC_FUNCTIONS(parser_t, ast_value*, imm_float)
22 MEM_VEC_FUNCTIONS(parser_t, ast_value*, locals)
23 MEM_VEC_FUNCTIONS(parser_t, ast_function*, functions)
/* Report a parse error. fmt and the variadic arguments carry the message in
 * printf style (callers pass e.g. "unexpected ident: %s"); the code that
 * formats them is not visible in this view. */
25 void parseerror(parser_t *parser, const char *fmt, ...)
/* prefix the message with the file name and line of the lexer's current token */
30 printf("error %s:%lu: ", parser->lex->tok->ctx.file, (unsigned long)parser->lex->tok->ctx.line);
/* Advance to the next token: the result of lex_do() becomes parser->tok.
 * Callers test the result as `if (!parser_next(parser))` to detect that no
 * usable token followed. */
41 bool parser_next(parser_t *parser)
43 /* lex_do kills the previous token */
44 parser->tok = lex_do(parser->lex);
/* end of file or a lexer error (any value >= TOKEN_ERROR); presumably the
 * function returns false in this case - the return statements are not shown */
45 if (parser->tok == TOKEN_EOF || parser->tok >= TOKEN_ERROR)
50 /* lift a token out of the parser so it's not destroyed by parser_next */
51 token *parser_lift(parser_t *parser)
/* remember the lexer's current token ... */
53 token *tok = parser->lex->tok;
/* ... and detach it from the lexer, so the lexer no longer refers to it
 * (presumably the caller becomes responsible for it - confirm against callers) */
54 parser->lex->tok = NULL;
/* Shorthand accessors for the lexer's current token of parser `p`:
 *   parser_tokval - the token's value (used as a string, e.g. with strcmp)
 *   parser_token  - the token itself
 *   parser_ctx    - the token's lex_ctx (source position)
 * The argument is parenthesized so that any pointer expression may be passed,
 * not only a plain identifier. */
58 #define parser_tokval(p) ((p)->lex->tok->value)
59 #define parser_token(p) ((p)->lex->tok)
60 #define parser_ctx(p) ((p)->lex->tok->ctx)
/* Return the immediate value for the float constant d. An entry of
 * parser->imm_float whose stored value compares equal to d is reused;
 * otherwise a new TYPE_FLOAT value named "#IMMEDIATE" is created at the
 * current token's context and appended to parser->imm_float. */
62 ast_value* parser_const_float(parser_t *parser, double d)
/* reuse an existing immediate with the same value (exact == comparison) */
66 for (i = 0; i < parser->imm_float_count; ++i) {
67 if (parser->imm_float[i]->constval.vfloat == d)
68 return parser->imm_float[i];
/* no match: create a fresh immediate */
70 out = ast_value_new(parser_ctx(parser), "#IMMEDIATE", TYPE_FLOAT);
72 out->constval.vfloat = d;
/* could not be appended to the immediates vector: release it again */
73 if (!parser_t_imm_float_add(parser, out)) {
74 ast_value_delete(out);
/* Linear search of parser->globals for a value whose name equals `name`;
 * the first match is returned. The no-match return is not visible here;
 * callers test the result for NULL. */
80 ast_value* parser_find_global(parser_t *parser, const char *name)
83 for (i = 0; i < parser->globals_count; ++i) {
84 if (!strcmp(parser->globals[i]->name, name))
85 return parser->globals[i];
/* Look up `name` among the local variables and, failing that, among the
 * parameters of the function currently being parsed. `upto` bounds the
 * search of parser->locals from below: callers pass 0 to search all locals
 * or parser->blocklocal to search only the current block. */
90 ast_value* parser_find_local(parser_t *parser, const char *name, size_t upto)
/* walk the locals from the end of the vector while i > upto; the index
 * update is on a line not shown in this view */
94 for (i = parser->locals_count; i > upto;) {
96 if (!strcmp(parser->locals[i]->name, name))
97 return parser->locals[i];
/* not a local: check the parameters stored on the current function's vtype */
99 fun = parser->function->vtype;
100 for (i = 0; i < fun->params_count; ++i) {
101 if (!strcmp(fun->params[i]->name, name))
102 return fun->params[i];
/* Resolve a variable name: locals and function parameters take precedence
 * (parser_find_local with upto = 0), globals are the fallback. */
107 ast_value* parser_find_var(parser_t *parser, const char *name)
110 v = parser_find_local(parser, name, 0);
111 if (!v) v = parser_find_global(parser, name);
/* paramlist_t holds a single vector `p` of ast_value*; parser_parse_type
 * uses it to collect the parameters of a function type. */
116 MEM_VECTOR_MAKE(ast_value*, p);
/* helper functions for that vector (presumably the source of paramlist_t_p_add) */
118 MEM_VEC_FUNCTIONS(paramlist_t, ast_value*, p)
/* Parse the remainder of a type whose base type is `basetype`. If the
 * current token is '(' a parameter list follows: each parameter is parsed by
 * a recursive call and may be followed by an identifier naming it. The
 * result is a new ast_value named "<unnamed>" that receives the collected
 * parameters. `isfunc` is an out-parameter the caller later tests to decide
 * whether a function was declared (where it is set is not visible here). */
120 static ast_value *parser_parse_type(parser_t *parser, int basetype, bool *isfunc)
124 lex_ctx ctx = parser_ctx(parser);
125 int vtype = basetype;
/* start with an empty parameter vector */
129 MEM_VECTOR_INIT(&params, p);
133 if (parser->tok == '(') {
139 if (!parser_next(parser))
/* ')' right away: empty parameter list */
142 if (parser->tok == ')')
/* the current token carries the parameter's base type */
145 temptype = parser_token(parser)->constval.t;
146 if (!parser_next(parser))
149 param = parser_parse_type(parser, temptype, &dummy);
155 if (parser->tok == TOKEN_IDENT) {
156 /* named parameter */
157 if (!ast_value_set_name(param, parser_tokval(parser)))
159 if (!parser_next(parser))
163 if (!paramlist_t_p_add(&params, param)) {
164 parseerror(parser, "Out of memory while parsing typename");
/* a parameter is followed by ',' (more parameters) or ')' (end of list) */
168 if (parser->tok == ',')
170 if (parser->tok == ')')
172 parseerror(parser, "Unexpected token");
175 if (!parser_next(parser))
179 var = ast_value_new(ctx, "<unnamed>", vtype);
/* hand the collected parameters over to the new value */
182 MEM_VECTOR_MOVE(&params, p, var, params);
/* cleanup: delete the parameters collected so far and clear the vector */
185 for (i = 0; i < params.p_count; ++i)
186 ast_value_delete(params.p[i]);
187 MEM_VECTOR_CLEAR(&params, p);
/* Fields of a shunting-yard stack element. For operators, etype - 1 is the
 * index into the operators table (see syop and parser_sy_pop). */
193 size_t etype; /* 0 = expression, others are operators */
197 ast_value *value; /* need to know if we can assign */
198 ast_block *block; /* for commas and function calls */
/* Shunting-yard state: `out` is the stack of operands/results and `ops` the
 * stack of pending operators and parentheses, both vectors of sy_elem. */
203 MEM_VECTOR_MAKE(sy_elem, out);
204 MEM_VECTOR_MAKE(sy_elem, ops);
/* helper functions for the two vectors (presumably the source of
 * shunt_out_add and shunt_ops_add) */
206 MEM_VEC_FUNCTIONS(shunt, sy_elem, out)
207 MEM_VEC_FUNCTIONS(shunt, sy_elem, ops)
/* Build a stack element for the expression v at source position ctx; used
 * for operation results and constants pushed onto the `out` stack. The body
 * is not visible in this view. */
209 static sy_elem syexp(lex_ctx ctx, ast_expression *v) {
/* Build a stack element for the variable v at source position ctx.
 * Presumably it also records v in the element's `value` field, which
 * parser_sy_pop reads for assignments - the rest of the body is not shown. */
219 static sy_elem syval(lex_ctx ctx, ast_value *v) {
/* the value doubles as the element's expression */
222 e.out = (ast_expression*)v;
/* Build a stack element for the block v at source position ctx (pushed by
 * parser_sy_pop for the comma operator). Presumably it also records v in
 * the element's `block` field - the rest of the body is not shown. */
230 static sy_elem syblock(lex_ctx ctx, ast_block *v) {
/* the block doubles as the element's expression */
233 e.out = (ast_expression*)v;
/* Build a stack element for the operator `op`, which must point into the
 * operators table. */
241 static sy_elem syop(lex_ctx ctx, const oper_info *op) {
/* 1-based index of op within operators[]; 0 stays reserved for expressions */
243 e.etype = 1 + (op - operators);
/* Build a stack element for an opening parenthesis. Callers pass p = 1 for a
 * grouping paren and p = 'f' for a function-call paren, with `off` being the
 * index of the function on the `out` stack. Presumably p and off end up in
 * the element's `paren` and `off` fields - the body is not visible here. */
252 static sy_elem syparen(lex_ctx ctx, int p, size_t off) {
/* Apply the operator on top of sy->ops: its operands are taken from the top
 * of sy->out, the resulting AST node is built according to the operator and
 * the operand types, and the result is pushed back onto sy->out. Reports an
 * error via parseerror() when the stacks are inconsistent or the operand
 * types are not supported by the operator. */
264 static bool parser_sy_pop(parser_t *parser, shunt *sy)
268 ast_expression *out = NULL;
269 ast_expression *exprs[3];
271 ast_block *blocks[3];
274 if (!sy->ops_count) {
275 parseerror(parser, "internal error: missing operator");
/* a parenthesis on top of the operator stack was never closed */
279 if (sy->ops[sy->ops_count-1].paren) {
280 parseerror(parser, "unmatched parenthesis");
/* etype is the 1-based index into the operators table */
284 op = &operators[sy->ops[sy->ops_count-1].etype - 1];
285 ctx = sy->ops[sy->ops_count-1].ctx;
287 if (sy->out_count < op->operands) {
/* the count is cast to int to match %i, as done for the other counts
 * printed in this file */
288 parseerror(parser, "internal error: not enough operands: %i", (int)sy->out_count);
/* pop the operands; they stay readable just above the new top of the stack */
294 sy->out_count -= op->operands;
295 for (i = 0; i < op->operands; ++i) {
296 exprs[i] = sy->out[sy->out_count+i].out;
297 vars[i] = sy->out[sy->out_count+i].value;
298 blocks[i] = sy->out[sy->out_count+i].block;
/* only the comma operator accepts an empty block as its first operand */
301 if (blocks[0] && !blocks[0]->exprs_count && op->id != opid1(',')) {
302 parseerror(parser, "internal error: operator cannot be applied on empty blocks");
309 parseerror(parser, "internal error: unhandled operand");
/* comma: append to the existing block, or start a new block holding both
 * operands; the block takes the type of the right-hand expression */
314 if (!ast_block_exprs_add(blocks[0], exprs[1]))
317 blocks[0] = ast_block_new(ctx);
318 if (!ast_block_exprs_add(blocks[0], exprs[0]) ||
319 !ast_block_exprs_add(blocks[0], exprs[1]))
324 if (!ast_block_set_type(blocks[0], exprs[1]))
327 sy->out[sy->out_count++] = syblock(ctx, blocks[0]);
/* addition: both operands must have the same type */
331 if (exprs[0]->expression.vtype != exprs[1]->expression.vtype) {
332 parseerror(parser, "Cannot add type %s and %s",
333 type_name[exprs[0]->expression.vtype],
334 type_name[exprs[1]->expression.vtype]);
337 switch (exprs[0]->expression.vtype) {
339 out = (ast_expression*)ast_binary_new(ctx, INSTR_ADD_F, exprs[0], exprs[1]);
342 out = (ast_expression*)ast_binary_new(ctx, INSTR_ADD_V, exprs[0], exprs[1]);
345 parseerror(parser, "Cannot add type %s and %s",
346 type_name[exprs[0]->expression.vtype],
347 type_name[exprs[1]->expression.vtype]);
/* subtraction: both operands must have the same type */
352 if (exprs[0]->expression.vtype != exprs[1]->expression.vtype) {
353 parseerror(parser, "Cannot subtract type %s from %s",
354 type_name[exprs[1]->expression.vtype],
355 type_name[exprs[0]->expression.vtype]);
358 switch (exprs[0]->expression.vtype) {
360 out = (ast_expression*)ast_binary_new(ctx, INSTR_SUB_F, exprs[0], exprs[1]);
363 out = (ast_expression*)ast_binary_new(ctx, INSTR_SUB_V, exprs[0], exprs[1]);
366 parseerror(parser, "Cannot subtract type %s from %s",
367 type_name[exprs[1]->expression.vtype],
368 type_name[exprs[0]->expression.vtype]);
/* multiplication: the instruction depends on the float/vector combination.
 * NOTE(review): this check only rejects operands that differ in type while
 * neither is a vector nor a float, so e.g. float * <other type> reaches
 * INSTR_MUL_F below - confirm whether that is intended. */
373 if (exprs[0]->expression.vtype != exprs[1]->expression.vtype &&
374 exprs[0]->expression.vtype != TYPE_VECTOR &&
375 exprs[0]->expression.vtype != TYPE_FLOAT &&
376 exprs[1]->expression.vtype != TYPE_VECTOR &&
377 exprs[1]->expression.vtype != TYPE_FLOAT)
379 parseerror(parser, "Cannot multiply type %s from %s",
380 type_name[exprs[1]->expression.vtype],
381 type_name[exprs[0]->expression.vtype]);
384 switch (exprs[0]->expression.vtype) {
386 if (exprs[1]->expression.vtype == TYPE_VECTOR)
387 out = (ast_expression*)ast_binary_new(ctx, INSTR_MUL_FV, exprs[0], exprs[1]);
389 out = (ast_expression*)ast_binary_new(ctx, INSTR_MUL_F, exprs[0], exprs[1]);
392 if (exprs[1]->expression.vtype == TYPE_FLOAT)
393 out = (ast_expression*)ast_binary_new(ctx, INSTR_MUL_VF, exprs[0], exprs[1]);
395 out = (ast_expression*)ast_binary_new(ctx, INSTR_MUL_V, exprs[0], exprs[1]);
398 parseerror(parser, "Cannot multiply type %s from %s",
399 type_name[exprs[1]->expression.vtype],
400 type_name[exprs[0]->expression.vtype]);
/* division: only float / float is supported */
405 if (exprs[0]->expression.vtype != exprs[1]->expression.vtype ||
406 exprs[0]->expression.vtype != TYPE_FLOAT)
408 parseerror(parser, "Cannot divide types %s and %s",
409 type_name[exprs[0]->expression.vtype],
410 type_name[exprs[1]->expression.vtype]);
413 out = (ast_expression*)ast_binary_new(ctx, INSTR_DIV_F, exprs[0], exprs[1]);
/* assignment: the store instruction is selected by the type of vars[0] */
419 parseerror(parser, "Cannot assign to non-variable");
422 out = (ast_expression*)ast_store_new(ctx,
423 type_store_instr[vars[0]->expression.vtype],
429 parseerror(parser, "failed to apply operand %s", op->op);
/* push the result back onto the output stack */
433 sy->out[sy->out_count++] = syexp(ctx, out);
/* Close a function-call parenthesis: builds an ast_call for the function at
 * sy->out[fid] (fid is the offset stored with the call's paren entry),
 * attaches the parameters found above it on the output stack, and replaces
 * out[fid] with the call. Afterwards the callee is checked to be a
 * TYPE_FUNCTION value whose declared parameter count matches the number of
 * arguments given.
 * NOTE(review): the stacks are indexed with ops_count / out_count rather
 * than count-1; presumably the counts are decremented on lines not shown
 * in this view. */
437 static bool parser_close_call(parser_t *parser, shunt *sy)
439 /* was a function call */
447 fid = sy->ops[sy->ops_count].off;
449 /* out[fid] is the function
450 * everything above is parameters...
452 * 1 params = ast_expression
456 if (sy->out_count < 1 || sy->out_count <= fid) {
457 parseerror(parser, "internal error: function call needs function and parameter list...");
461 fun = sy->out[fid].out;
463 call = ast_call_new(sy->ops[sy->ops_count].ctx, fun);
465 parseerror(parser, "out of memory");
469 printf("fid = %i, out_count = %i\n", (int)fid, (int)sy->out_count);
471 if (fid+1 == sy->out_count) {
474 } else if (fid+2 == sy->out_count) {
477 params = sy->out[sy->out_count].block;
481 if (!ast_call_params_add(call, sy->out[sy->out_count].out)) {
482 ast_delete(sy->out[sy->out_count].out);
483 parseerror(parser, "out of memory");
487 paramcount = params->exprs_count;
488 MEM_VECTOR_MOVE(params, exprs, call, params);
492 parseerror(parser, "invalid function call");
496 /* overwrite fid, the function, with a call */
497 sy->out[fid] = syexp(call->expression.node.context, (ast_expression*)call);
499 if (fun->expression.vtype != TYPE_FUNCTION) {
500 parseerror(parser, "not a function");
504 if (!fun->expression.next) {
505 parseerror(parser, "could not determine function parameters");
509 ast_value *v = (ast_value*)(fun->expression.next);
510 if (v->params_count != paramcount) {
511 parseerror(parser, "expected %i parameters, got %i", (int)v->params_count, (int)paramcount);
/* Handle a ')' token: operators are popped off sy->ops until the matching
 * opening entry is reached. A function-call paren ('f') is closed through
 * parser_close_call(). On reaching a grouping paren (paren == 1) the result
 * is !functions_only, i.e. a grouping paren is rejected when the caller
 * only accepts the end of a function call. */
520 static bool parser_close_paren(parser_t *parser, shunt *sy, bool functions_only)
522 if (!sy->ops_count) {
523 parseerror(parser, "unmatched closing paren");
/* a grouping paren directly on top means nothing was parsed between "(" and ")" */
526 if (sy->ops[sy->ops_count-1].paren == 1) {
527 parseerror(parser, "empty parenthesis expression");
530 while (sy->ops_count) {
531 if (sy->ops[sy->ops_count-1].paren == 'f') {
532 if (!parser_close_call(parser, sy))
536 if (sy->ops[sy->ops_count-1].paren == 1) {
538 return !functions_only;
/* anything else is a pending operator: apply it and keep unwinding */
540 if (!parser_sy_pop(parser, sy))
/* Parse one expression with a shunting-yard scheme: operands are pushed onto
 * sy.out, operators and parentheses onto sy.ops, and parser_sy_pop() folds
 * them into AST nodes. The expression left in sy.out[0] is the result. Two
 * exit sequences are visible at the end; both clear the stacks and set the
 * lexer's noops flag back to true (the second is presumably the error exit). */
546 static ast_expression* parser_expression(parser_t *parser)
548 ast_expression *expr = NULL;
552 MEM_VECTOR_INIT(&sy, out);
553 MEM_VECTOR_INIT(&sy, ops);
/* nextwant: whether an operator is expected after the current token */
559 bool nextwant = true;
/* --- operand position --- */
/* identifier: must resolve to a known variable */
560 if (parser->tok == TOKEN_IDENT)
563 ast_value *var = parser_find_var(parser, parser_tokval(parser));
565 parseerror(parser, "unexpected ident: %s", parser_tokval(parser));
568 if (!shunt_out_add(&sy, syval(parser_ctx(parser), var))) {
569 parseerror(parser, "out of memory");
/* float constant: pushed as a shared immediate */
573 else if (parser->tok == TOKEN_FLOATCONST) {
574 ast_value *val = parser_const_float(parser, (parser_token(parser)->constval.f));
577 if (!shunt_out_add(&sy, syexp(parser_ctx(parser), (ast_expression*)val))) {
578 parseerror(parser, "out of memory");
/* integer constant: converted to double and treated as a float immediate */
582 else if (parser->tok == TOKEN_INTCONST) {
583 ast_value *val = parser_const_float(parser, (double)(parser_token(parser)->constval.i));
586 if (!shunt_out_add(&sy, syexp(parser_ctx(parser), (ast_expression*)val))) {
587 parseerror(parser, "out of memory");
/* grouping parenthesis */
591 else if (parser->tok == '(') {
592 nextwant = false; /* not expecting an operator next */
593 if (!shunt_ops_add(&sy, syparen(parser_ctx(parser), 1, 0))) {
594 parseerror(parser, "out of memory");
598 else if (parser->tok == ')') {
599 /* allowed for function calls */
600 if (!parser_close_paren(parser, &sy, true))
604 /* TODO: prefix operators */
605 parseerror(parser, "expected statement");
/* tell the lexer whether operator tokens are wanted for the next token */
609 parser->lex->flags.noops = !wantop;
/* --- operator position --- */
611 if (parser->tok == '(') {
612 /* we expected an operator, this is the function-call operator */
/* the paren entry remembers the index of the function on the output stack */
613 if (!shunt_ops_add(&sy, syparen(parser_ctx(parser), 'f', sy.out_count-1))) {
614 parseerror(parser, "out of memory");
618 else if (parser->tok == ')') {
619 /* we do expect an operator next */
620 /* closing an opening paren */
621 if (!parser_close_paren(parser, &sy, false))
624 else if (parser->tok != TOKEN_OPERATOR) {
625 parseerror(parser, "expected operator or end of statement");
629 /* classify the operator */
630 /* TODO: suffix operators */
632 const oper_info *olast = NULL;
/* find the table entry whose text matches the token, skipping prefix and
 * suffix operators */
634 for (o = 0; o < operator_count; ++o) {
635 if (!(operators[o].flags & OP_PREFIX) &&
636 !(operators[o].flags & OP_SUFFIX) && /* remove this */
637 !strcmp(parser_tokval(parser), operators[o].op))
642 if (o == operator_count) {
643 /* no operator found... must be the end of the statement */
646 /* found an operator */
/* olast: the operator on top of the stack, unless a parenthesis is on top */
649 if (sy.ops_count && !sy.ops[sy.ops_count-1].paren)
650 olast = &operators[sy.ops[sy.ops_count-1].etype-1];
/* apply stacked operators while the new one has lower precedence, or
 * equal precedence and left associativity */
653 (op->prec < olast->prec) ||
654 (op->assoc == ASSOC_LEFT && op->prec <= olast->prec) ) )
656 if (!parser_sy_pop(parser, &sy))
658 if (sy.ops_count && !sy.ops[sy.ops_count-1].paren)
659 olast = &operators[sy.ops[sy.ops_count-1].etype-1];
662 if (!shunt_ops_add(&sy, syop(parser_ctx(parser), op)))
666 parser->lex->flags.noops = true;
668 if (!parser_next(parser)) {
/* ';' terminates the expression (presumably leaving the loop on a line not shown) */
671 if (parser->tok == ';') {
675 if (!parser_next(parser)) {
676 parseerror(parser, "Unexpected end of file");
/* apply all operators that are still pending */
680 while (sy.ops_count) {
681 if (!parser_sy_pop(parser, &sy))
685 parser->lex->flags.noops = true;
687 parseerror(parser, "empty expression");
/* the finished expression is the bottom element of the output stack */
690 expr = sy.out[0].out;
691 MEM_VECTOR_CLEAR(&sy, out);
692 MEM_VECTOR_CLEAR(&sy, ops);
/* second exit sequence: reset the lexer flag and release both stacks */
696 parser->lex->flags.noops = true;
697 MEM_VECTOR_CLEAR(&sy, out);
698 MEM_VECTOR_CLEAR(&sy, ops);
/* forward declaration: parser_variable is defined after its first use below */
702 static bool parser_variable(parser_t *parser, ast_block *localblock);
/* Parse one statement of a function body and add the result to `block`:
 * a local variable declaration, a "return" statement, or a plain expression.
 * Nested '{' blocks and other keywords are reported as errors. */
703 static bool parser_body_do(parser_t *parser, ast_block *block)
/* a type name starts a local variable declaration */
705 if (parser->tok == TOKEN_TYPENAME)
708 if (!parser_variable(parser, block))
712 else if (parser->tok == TOKEN_KEYWORD)
714 if (!strcmp(parser_tokval(parser), "return"))
/* step past the keyword, parse the returned expression and wrap it in a
 * return node */
719 if (!parser_next(parser)) {
720 parseerror(parser, "expected return expression");
724 exp = parser_expression(parser);
727 ret = ast_return_new(exp->expression.node.context, exp);
732 if (!ast_block_exprs_add(block, (ast_expression*)ret)) {
738 parseerror(parser, "Unexpected keyword");
741 else if (parser->tok == '{')
744 parseerror(parser, "TODO: inner blocks: %s", parser_tokval(parser));
/* anything else is parsed as an expression statement */
749 ast_expression *exp = parser_expression(parser);
752 if (!ast_block_exprs_add(block, exp)) {
/* Parse a '{ ... }' block: creates an ast_block and fills it statement by
 * statement through parser_body_do() until '}' is reached. The block is
 * deleted again when a statement fails or the closing '}' is missing. */
760 static ast_block* parser_parse_block(parser_t *parser)
762 size_t oldblocklocal;
763 ast_block *block = NULL;
/* remember the enclosing block's marker; locals declared from here on belong
 * to this block (the marker is what parser_variable passes to
 * parser_find_local for its duplicate check) */
765 oldblocklocal = parser->blocklocal;
766 parser->blocklocal = parser->locals_count;
768 if (!parser_next(parser)) { /* skip the '{' */
769 parseerror(parser, "expected function body");
773 block = ast_block_new(parser_ctx(parser));
/* parse statements until '}', end of file or a lexer error */
775 while (parser->tok != TOKEN_EOF && parser->tok < TOKEN_ERROR)
777 if (parser->tok == '}')
780 if (!parser_body_do(parser, block)) {
781 ast_block_delete(block);
/* the loop ended without reaching the closing brace */
787 if (parser->tok != '}') {
788 ast_block_delete(block);
/* step past the '}'; the result is deliberately ignored */
791 (void)parser_next(parser);
/* restore the enclosing block's marker */
795 parser->blocklocal = oldblocklocal;
/* Parse a variable or function declaration starting at a type name token.
 * localblock is NULL for a global declaration (parser_do passes NULL) and the
 * enclosing block for a local one (parser_body_do passes its block).
 *
 * Visible flow:
 *  - the base type is read from the current token, then the full type is
 *    parsed with parser_parse_type() and an identifier is required;
 *  - a global must not already exist; a local must not already exist above
 *    parser->blocklocal;
 *  - for a function, an ast_value of TYPE_FUNCTION (fval) and an
 *    ast_function are created, the parsed value is attached as
 *    fval->expression.next, its parameters are moved to fval, and the
 *    function is added to parser->functions;
 *  - the value is added to parser->globals or parser->locals; a local is
 *    also added to localblock, and locals_count is decremented again when
 *    that fails;
 *  - after the name: ';' ends the declaration, ',' is checked for as well
 *    (presumably continuing with another declarator), anything else must
 *    be '=';
 *  - after '=': '#' introduces a builtin number, which is rejected inside
 *    functions and for non-functions, must be an integer constant greater
 *    than zero, and is stored negated in func->builtin; '{' starts a
 *    function body, parsed by parser_parse_block() with parser->function
 *    temporarily set to the new function and added to it as a block; any
 *    other initializer reports "TODO, const assignment";
 *  - finally ',' or ';' is expected. */
799 static bool parser_variable(parser_t *parser, ast_block *localblock)
802 ast_function *func = NULL;
/* the type name token carries the base type */
806 int basetype = parser_token(parser)->constval.t;
810 if (!parser_next(parser)) { /* skip basetype or comma */
811 parseerror(parser, "expected variable declaration");
817 ctx = parser_ctx(parser);
818 var = parser_parse_type(parser, basetype, &isfunc);
823 if (parser->tok != TOKEN_IDENT) {
824 parseerror(parser, "expected variable name\n");
/* reject redeclaration of a global */
828 if (!localblock && parser_find_global(parser, parser_tokval(parser))) {
829 ast_value_delete(var);
830 parseerror(parser, "global already exists: %s\n", parser_tokval(parser));
/* reject redeclaration of a local within the current block */
834 if (localblock && parser_find_local(parser, parser_tokval(parser), parser->blocklocal)) {
835 ast_value_delete(var);
836 parseerror(parser, "local variable already exists: %s\n", parser_tokval(parser));
840 if (!ast_value_set_name(var, parser_tokval(parser))) {
841 parseerror(parser, "failed to set variable name\n");
842 ast_value_delete(var);
847 /* a function was defined */
850 /* turn var into a value of TYPE_FUNCTION, with the old var
853 fval = ast_value_new(ctx, var->name, TYPE_FUNCTION);
854 func = ast_function_new(ctx, var->name, fval);
855 if (!fval || !func) {
856 ast_value_delete(var);
857 if (fval) ast_value_delete(fval);
858 if (func) ast_function_delete(func);
862 fval->expression.next = (ast_expression*)var;
863 MEM_VECTOR_MOVE(var, params, fval, params);
865 if (!parser_t_functions_add(parser, func)) {
866 ast_value_delete(var);
867 if (fval) ast_value_delete(fval);
868 if (func) ast_function_delete(func);
875 if ( (!localblock && !parser_t_globals_add(parser, var)) ||
876 ( localblock && !parser_t_locals_add(parser, var)) )
878 ast_value_delete(var);
881 if (localblock && !ast_block_locals_add(localblock, var))
883 parser->locals_count--;
884 ast_value_delete(var);
888 if (!parser_next(parser)) {
889 ast_value_delete(var);
893 if (parser->tok == ';') {
894 if (!parser_next(parser))
895 return parser->tok == TOKEN_EOF;
899 if (parser->tok == ',') {
904 if (parser->tok != '=') {
905 parseerror(parser, "expected '=' or ';'");
909 if (!parser_next(parser))
912 if (parser->tok == '#') {
914 parseerror(parser, "cannot declare builtins within functions");
917 if (!isfunc || !func) {
918 parseerror(parser, "unexpected builtin number, '%s' is not a function", var->name);
921 if (!parser_next(parser)) {
922 parseerror(parser, "expected builtin number");
925 if (parser->tok != TOKEN_INTCONST) {
926 parseerror(parser, "builtin number must be an integer constant");
929 if (parser_token(parser)->constval.i <= 0) {
930 parseerror(parser, "builtin number must be positive integer greater than zero");
934 func->builtin = -parser_token(parser)->constval.i;
935 } else if (parser->tok == '{') {
938 ast_function *old = parser->function;
941 parseerror(parser, "cannot declare functions within functions");
945 parser->function = func;
946 block = parser_parse_block(parser);
947 parser->function = old;
952 if (!ast_function_blocks_add(func, block)) {
953 ast_block_delete(block);
958 parseerror(parser, "TODO, const assignment");
961 if (!parser_next(parser))
964 if (parser->tok == ',') {
969 if (parser->tok != ';') {
970 parseerror(parser, "expected semicolon");
974 (void)parser_next(parser);
/* Parse one top-level construct. Only declarations starting with a type name
 * are visibly handled (as globals, via parser_variable with a NULL block);
 * the keyword and '.' branches carry comments only in this view, and any
 * other token is reported as unexpected. */
980 static bool parser_do(parser_t *parser)
982 if (parser->tok == TOKEN_TYPENAME)
984 return parser_variable(parser, NULL);
986 else if (parser->tok == TOKEN_KEYWORD)
988 /* handle 'var' and 'const' */
991 else if (parser->tok == '.')
993 /* entity-member declaration */
998 parseerror(parser, "unexpected token: %s", parser->lex->tok->value);
/* Compile one source file: allocates a parser, opens a lexer on `filename`,
 * parses top-level constructs with parser_do() until end of file or a lexer
 * error, then generates IR for the float immediates, the globals and the
 * functions into a builder named "gmqcc_out", dumps the IR with printf and
 * starts releasing the parser's data. Failures are reported on stdout. The
 * end of the function lies outside this view. */
1004 bool parser_compile(const char *filename)
1010 parser = (parser_t*)mem_a(sizeof(parser_t));
/* zero the whole parser structure; sizeof(*parser) is the size of the
 * structure, whereas sizeof(parser) would only be the size of the pointer */
1014 memset(parser, 0, sizeof(*parser));
1016 MEM_VECTOR_INIT(parser, globals);
1017 MEM_VECTOR_INIT(parser, locals);
1018 parser->lex = lex_open(filename);
1021 printf("failed to open file \"%s\"\n", filename);
1025 /* initial lexer/parser state */
1026 parser->lex->flags.noops = true;
/* fetch the first token, then parse until end of file or a lexer error */
1028 if (parser_next(parser))
1030 while (parser->tok != TOKEN_EOF && parser->tok < TOKEN_ERROR)
1032 if (!parser_do(parser)) {
1033 if (parser->tok == TOKEN_EOF)
1034 parseerror(parser, "unexpected eof");
1036 parseerror(parser, "parse error\n");
1037 lex_close(parser->lex);
/* parsing is finished: the lexer is no longer needed */
1044 lex_close(parser->lex);
1046 ir = ir_builder_new("gmqcc_out");
1048 printf("failed to allocate builder\n");
/* code generation order: float immediates, globals, then functions */
1052 for (i = 0; i < parser->imm_float_count; ++i) {
1053 if (!ast_global_codegen(parser->imm_float[i], ir)) {
1054 printf("failed to generate global %s\n", parser->imm_float[i]->name);
1057 for (i = 0; i < parser->globals_count; ++i) {
1058 if (!ast_global_codegen(parser->globals[i], ir)) {
1059 printf("failed to generate global %s\n", parser->globals[i]->name);
1062 for (i = 0; i < parser->functions_count; ++i) {
1063 if (!ast_function_codegen(parser->functions[i], ir)) {
1064 printf("failed to generate function %s\n", parser->functions[i]->name);
/* each function is finalized right after its code has been generated */
1066 if (!ir_function_finalize(parser->functions[i]->ir_func)) {
1067 printf("failed to finalize function %s\n", parser->functions[i]->name);
1071 ir_builder_dump(ir, printf);
/* cleanup: delete the global values and release their vector */
1074 for (i = 0; i < parser->globals_count; ++i) {
1075 ast_value_delete(parser->globals[i]);
1077 MEM_VECTOR_CLEAR(parser, globals);