/* Parser state (partial view of the structure): vectors of global values,
 * functions and float immediates, the function currently being parsed,
 * and the vector of local values. */
11 MEM_VECTOR_MAKE(ast_value*, globals);
12 MEM_VECTOR_MAKE(ast_function*, functions);
/* float constants registered through parser_const_float() */
13 MEM_VECTOR_MAKE(ast_value*, imm_float);
/* function whose body is being parsed; parser_variable sets it around parser_parse_block() */
15 ast_function *function;
/* local variables; parser_find_local() walks this vector downwards from locals_count */
16 MEM_VECTOR_MAKE(ast_value*, locals);
/* Instantiate the vector helper functions for each parser_t vector. The code
 * in this file calls parser_t_imm_float_add, parser_t_globals_add,
 * parser_t_locals_add and parser_t_functions_add. */
20 MEM_VEC_FUNCTIONS(parser_t, ast_value*, globals)
21 MEM_VEC_FUNCTIONS(parser_t, ast_value*, imm_float)
22 MEM_VEC_FUNCTIONS(parser_t, ast_value*, locals)
23 MEM_VEC_FUNCTIONS(parser_t, ast_function*, functions)
/* Report a parse error. The visible part prints an "error <file>:<line>: "
 * prefix taken from the context of the lexer's current token.
 * fmt and the variadic arguments are presumably formatted after the prefix;
 * that part is not shown here. */
25 void parseerror(parser_t *parser, const char *fmt, ...)
/* the line number is cast to unsigned long to match the %lu conversion */
30 printf("error %s:%lu: ", parser->lex->tok->ctx.file, (unsigned long)parser->lex->tok->ctx.line);
/* Advance to the next token: store the result of lex_do() in parser->tok and
 * test it for TOKEN_EOF or an error token (any value >= TOKEN_ERROR).
 * Callers in this file treat a false return value as "no further token";
 * the return statements themselves are not shown here. */
41 bool parser_next(parser_t *parser)
43 /* lex_do kills the previous token */
44 parser->tok = lex_do(parser->lex);
45 if (parser->tok == TOKEN_EOF || parser->tok >= TOKEN_ERROR)
50 /* lift a token out of the parser so it's not destroyed by parser_next */
/* Takes the lexer's current token pointer and clears the lexer's own
 * reference to it. Presumably the saved pointer is returned to the caller;
 * the return statement is not shown here. */
51 token *parser_lift(parser_t *parser)
53 token *tok = parser->lex->tok;
/* the lexer no longer references the token after this */
54 parser->lex->tok = NULL;
/* Shorthand accessors for the lexer's current token: its text value, the
 * token itself and its source context. The macro argument is parenthesized
 * so that any pointer-valued expression can be passed safely. */
58 #define parser_tokval(p) ((p)->lex->tok->value)
59 #define parser_token(p) ((p)->lex->tok)
60 #define parser_ctx(p) ((p)->lex->tok->ctx)
/* Return the ast_value representing the float immediate d.
 * An entry of parser->imm_float whose constval.vfloat compares equal to d is
 * reused; otherwise a new TYPE_FLOAT value named "#IMMEDIATE" is created with
 * the current token's context and added to parser->imm_float. */
62 ast_value* parser_const_float(parser_t *parser, double d)
/* linear search for an already registered immediate with the same value */
66 for (i = 0; i < parser->imm_float_count; ++i) {
67 if (parser->imm_float[i]->constval.vfloat == d)
68 return parser->imm_float[i];
70 out = ast_value_new(parser_ctx(parser), "#IMMEDIATE", TYPE_FLOAT);
72 out->constval.vfloat = d;
/* adding to the vector failed: release the freshly created value again */
73 if (!parser_t_imm_float_add(parser, out)) {
74 ast_value_delete(out);
/* Look up a global by name: returns the first entry of parser->globals whose
 * name equals name (strcmp). The result when nothing matches is not shown
 * here; callers test the result against NULL. */
80 ast_value* parser_find_global(parser_t *parser, const char *name)
83 for (i = 0; i < parser->globals_count; ++i) {
84 if (!strcmp(parser->globals[i]->name, name))
85 return parser->globals[i];
/* Look up a local by name, walking parser->locals downwards from
 * locals_count while the index is greater than upto.
 * upto: lower bound of the search; parser_find_var passes 0 and
 * parser_variable passes parser->blocklocal.
 * NOTE(review): the index is presumably decremented before use on a line not
 * shown here - confirm. */
90 ast_value* parser_find_local(parser_t *parser, const char *name, size_t upto)
93 for (i = parser->locals_count; i > upto;) {
95 if (!strcmp(parser->locals[i]->name, name))
96 return parser->locals[i];
/* Resolve a variable name: locals are searched first (over the whole locals
 * vector, upto = 0), and globals only when no local matched. */
101 ast_value* parser_find_var(parser_t *parser, const char *name)
104 v = parser_find_local(parser, name, 0);
105 if (!v) v = parser_find_global(parser, name);
/* paramlist_t holds a vector p of ast_value pointers; parser_parse_type uses
 * it to collect the parameters of a function type (paramlist_t_p_add). */
110 MEM_VECTOR_MAKE(ast_value*, p);
112 MEM_VEC_FUNCTIONS(paramlist_t, ast_value*, p)
/* Parse the remainder of a type whose base type has already been read.
 * basetype: type code of the base type; it is the initial value of vtype.
 * isfunc:   output flag; where it is written is not visible in this view.
 * When the current token is '(' a parameter list follows: each parameter is
 * parsed recursively from its own type token, may be followed by an
 * identifier that names it, and is collected in params. A value named
 * "<unnamed>" of type vtype is then created with the context captured at
 * entry, and the collected parameters are moved into it.
 * The last visible lines delete every parameter still held in params and
 * clear the vector (presumably the failure path; surrounding lines are not
 * shown). */
114 static ast_value *parser_parse_type(parser_t *parser, int basetype, bool *isfunc)
118 lex_ctx ctx = parser_ctx(parser);
119 int vtype = basetype;
123 MEM_VECTOR_INIT(&params, p);
127 if (parser->tok == '(') {
133 if (!parser_next(parser))
136 if (parser->tok == ')')
/* the current token carries the parameter's type code */
139 temptype = parser_token(parser)->constval.t;
140 if (!parser_next(parser))
143 param = parser_parse_type(parser, temptype, &dummy);
149 if (parser->tok == TOKEN_IDENT) {
150 /* named parameter */
151 if (!ast_value_set_name(param, parser_tokval(parser)))
153 if (!parser_next(parser))
157 if (!paramlist_t_p_add(&params, param)) {
158 parseerror(parser, "Out of memory while parsing typename");
/* after a parameter only ',' or ')' may follow */
162 if (parser->tok == ',')
164 if (parser->tok == ')')
166 parseerror(parser, "Unexpected token");
169 if (!parser_next(parser))
173 var = ast_value_new(ctx, "<unnamed>", vtype);
/* hand the collected parameters over to the new value */
176 MEM_VECTOR_MOVE(&params, p, var, params);
/* release every parameter that is still owned by the local list */
179 for (i = 0; i < params.p_count; ++i)
180 ast_value_delete(params.p[i]);
181 MEM_VECTOR_CLEAR(&params, p);
/* Fields of one operand/operator stack element (partial view).
 * For operators etype is 1 + the index into operators[] (see syop), so that
 * 0 can denote a plain expression. */
187 size_t etype; /* 0 = expression, others are operators */
190 ast_value *value; /* need to know if we can assign */
/* shunt holds the two stacks used while parsing an expression: out for
 * operands/results and ops for pending operators and parenthesis markers.
 * The vector helpers shunt_out_add and shunt_ops_add are instantiated below. */
195 MEM_VECTOR_MAKE(sy_elem, out);
196 MEM_VECTOR_MAKE(sy_elem, ops);
198 MEM_VEC_FUNCTIONS(shunt, sy_elem, out)
199 MEM_VEC_FUNCTIONS(shunt, sy_elem, ops)
/* Build a stack element for a generic expression v with source context ctx.
 * The body is not visible here; presumably etype is 0 and value is unset -
 * TODO confirm. */
201 static sy_elem syexp(lex_ctx ctx, ast_expression *v) {
/* Build a stack element for the variable v with source context ctx.
 * The value is stored as the element's expression; presumably it is also
 * kept in the value field so assignment targets can be recognized
 * (parser_sy_pop reads .value) - TODO confirm, that line is not shown. */
210 static sy_elem syval(lex_ctx ctx, ast_value *v) {
213 e.out = (ast_expression*)v;
/* Build a stack element for the operator op. op must point into the
 * operators[] table: etype is set to its table index plus one, so that 0
 * stays reserved for plain expressions. */
220 static sy_elem syop(lex_ctx ctx, const oper_info *op) {
222 e.etype = 1 + (op - operators);
/* Build a stack element marking a parenthesis. parser_expression passes
 * p = 1 for '(' and later tests the paren field against 1; presumably p is
 * stored in that field - TODO confirm, the body is not shown. */
230 static sy_elem syparen(lex_ctx ctx, int p) {
/* Apply the operator on top of sy->ops to the topmost operands of sy->out
 * and push the resulting expression back onto sy->out.
 * Errors are reported through parseerror(): an empty operator stack, a
 * parenthesis marker on top, too few operands, or operand types the operator
 * does not support. Callers treat a false return value as failure.
 * The visible cases build ADD/SUB/MUL/DIV binary nodes for float and vector
 * operands and a store node for assignment. */
240 static bool parser_sy_pop(parser_t *parser, shunt *sy)
244 ast_expression *out = NULL;
245 ast_expression *exprs[3];
249 if (!sy->ops_count) {
250 parseerror(parser, "internal error: missing operator");
/* a parenthesis marker on top of the operator stack was never closed */
254 if (sy->ops[sy->ops_count-1].paren) {
255 parseerror(parser, "unmatched parenthesis");
/* etype is the operators[] index plus one (0 denotes a plain expression) */
259 op = &operators[sy->ops[sy->ops_count-1].etype - 1];
260 ctx = sy->ops[sy->ops_count-1].ctx;
262 if (sy->out_count < op->operands) {
/* cast so the argument matches the conversion whatever the count's integer type is */
263 parseerror(parser, "internal error: not enough operands: %lu", (unsigned long)sy->out_count);
/* take the operands off the output stack; they stay readable just above the new top */
269 sy->out_count -= op->operands;
270 for (i = 0; i < op->operands; ++i) {
271 exprs[i] = sy->out[sy->out_count+i].out;
272 vars[i] = sy->out[sy->out_count+i].value;
275 printf("Applying operator %s\n", op->op);
279 parseerror(parser, "internal error: unhandled operand");
/* addition: both operands must have the same type (float or vector) */
283 if (exprs[0]->expression.vtype != exprs[1]->expression.vtype) {
284 parseerror(parser, "Cannot add type %s and %s",
285 type_name[exprs[0]->expression.vtype],
286 type_name[exprs[1]->expression.vtype]);
289 switch (exprs[0]->expression.vtype) {
291 out = (ast_expression*)ast_binary_new(ctx, INSTR_ADD_F, exprs[0], exprs[1]);
294 out = (ast_expression*)ast_binary_new(ctx, INSTR_ADD_V, exprs[0], exprs[1]);
297 parseerror(parser, "Cannot add type %s and %s",
298 type_name[exprs[0]->expression.vtype],
299 type_name[exprs[1]->expression.vtype]);
/* subtraction: both operands must have the same type (float or vector) */
304 if (exprs[0]->expression.vtype != exprs[1]->expression.vtype) {
305 parseerror(parser, "Cannot subtract type %s from %s",
306 type_name[exprs[1]->expression.vtype],
307 type_name[exprs[0]->expression.vtype]);
310 switch (exprs[0]->expression.vtype) {
312 out = (ast_expression*)ast_binary_new(ctx, INSTR_SUB_F, exprs[0], exprs[1]);
315 out = (ast_expression*)ast_binary_new(ctx, INSTR_SUB_V, exprs[0], exprs[1]);
318 parseerror(parser, "Cannot subtract type %s from %s",
319 type_name[exprs[1]->expression.vtype],
320 type_name[exprs[0]->expression.vtype]);
/* multiplication: float and vector operands may be mixed.
 * NOTE(review): this check only rejects operands that differ AND are both
 * neither float nor vector; e.g. float * <other type> passes it and reaches
 * INSTR_MUL_F below - confirm whether that is intended. */
325 if (exprs[0]->expression.vtype != exprs[1]->expression.vtype &&
326 exprs[0]->expression.vtype != TYPE_VECTOR &&
327 exprs[0]->expression.vtype != TYPE_FLOAT &&
328 exprs[1]->expression.vtype != TYPE_VECTOR &&
329 exprs[1]->expression.vtype != TYPE_FLOAT)
331 parseerror(parser, "Cannot multiply type %s from %s",
332 type_name[exprs[1]->expression.vtype],
333 type_name[exprs[0]->expression.vtype]);
336 switch (exprs[0]->expression.vtype) {
338 if (exprs[1]->expression.vtype == TYPE_VECTOR)
339 out = (ast_expression*)ast_binary_new(ctx, INSTR_MUL_FV, exprs[0], exprs[1]);
341 out = (ast_expression*)ast_binary_new(ctx, INSTR_MUL_F, exprs[0], exprs[1]);
344 if (exprs[1]->expression.vtype == TYPE_FLOAT)
345 out = (ast_expression*)ast_binary_new(ctx, INSTR_MUL_VF, exprs[0], exprs[1]);
347 out = (ast_expression*)ast_binary_new(ctx, INSTR_MUL_V, exprs[0], exprs[1]);
350 parseerror(parser, "Cannot multiply type %s from %s",
351 type_name[exprs[1]->expression.vtype],
352 type_name[exprs[0]->expression.vtype]);
/* division: only float / float is accepted */
357 if (exprs[0]->expression.vtype != exprs[1]->expression.vtype ||
358 exprs[0]->expression.vtype != TYPE_FLOAT)
360 parseerror(parser, "Cannot divide types %s and %s",
361 type_name[exprs[0]->expression.vtype],
362 type_name[exprs[1]->expression.vtype]);
365 out = (ast_expression*)ast_binary_new(ctx, INSTR_DIV_F, exprs[0], exprs[1]);
/* assignment: the store instruction is selected by the type of the target variable */
371 parseerror(parser, "Cannot assign to non-variable");
374 out = (ast_expression*)ast_store_new(ctx,
375 type_store_instr[vars[0]->expression.vtype],
381 parseerror(parser, "failed to apply operand %s", op->op);
/* push the result as a plain expression element */
385 sy->out[sy->out_count++] = syexp(ctx, out);
/* Parse one expression using an operand stack (sy.out) and an operator stack
 * (sy.ops). The visible code reads either an operand (identifier, float or
 * integer constant, or an opening parenthesis) or an operator / closing
 * parenthesis. Operators already on the stack are applied through
 * parser_sy_pop() according to precedence and associativity before a new
 * operator is pushed. A ';' ends the expression; the remaining operators are
 * then applied and sy.out[0] is taken as the result.
 * parser->lex->flags.noops is updated along the way and set back to true at
 * both exits; its exact meaning to the lexer is not shown here. */
389 static ast_expression* parser_expression(parser_t *parser)
391 ast_expression *expr = NULL;
395 MEM_VECTOR_INIT(&sy, out);
396 MEM_VECTOR_INIT(&sy, ops);
402 bool nextwant = true;
403 if (parser->tok == TOKEN_IDENT)
/* identifiers must name a known local or global variable */
406 ast_value *var = parser_find_var(parser, parser_tokval(parser));
408 parseerror(parser, "unexpected ident: %s", parser_tokval(parser));
411 if (!shunt_out_add(&sy, syval(parser_ctx(parser), var))) {
412 parseerror(parser, "out of memory");
415 printf("Added: %s\n", var->name);
417 else if (parser->tok == TOKEN_FLOATCONST) {
418 ast_value *val = parser_const_float(parser, (parser_token(parser)->constval.f));
421 if (!shunt_out_add(&sy, syexp(parser_ctx(parser), (ast_expression*)val))) {
422 parseerror(parser, "out of memory");
426 else if (parser->tok == TOKEN_INTCONST) {
/* integer constants are converted to float immediates */
427 ast_value *val = parser_const_float(parser, (double)(parser_token(parser)->constval.i));
430 if (!shunt_out_add(&sy, syexp(parser_ctx(parser), (ast_expression*)val))) {
431 parseerror(parser, "out of memory");
434 printf("Added: %i\n", parser_token(parser)->constval.i);
436 else if (parser->tok == '(') {
437 nextwant = false; /* not expecting an operator next */
438 if (!shunt_ops_add(&sy, syparen(parser_ctx(parser), 1))) {
439 parseerror(parser, "out of memory");
444 /* TODO: prefix operators */
445 parseerror(parser, "expected statement");
449 parser->lex->flags.noops = !wantop;
451 if (parser->tok == ')') {
452 /* we do expect an operator next */
453 /* closing an opening paren */
454 printf("Applying closing paren\n");
456 parseerror(parser, "unmatched closing paren");
459 if (sy.ops[sy.ops_count-1].paren == 1) {
460 parseerror(parser, "empty parenthesis expression");
/* apply pending operators until the matching opening parenthesis marker is on top */
463 while (sy.ops_count) {
464 if (sy.ops[sy.ops_count-1].paren == 1) {
468 if (!parser_sy_pop(parser, &sy))
472 else if (parser->tok != TOKEN_OPERATOR) {
473 parseerror(parser, "expected operator or end of statement");
477 /* classify the operator */
478 /* TODO: suffix operators */
480 const oper_info *olast = NULL;
/* find the table entry for a binary operator (neither prefix nor suffix) with this spelling */
482 for (o = 0; o < operator_count; ++o) {
483 if (!(operators[o].flags & OP_PREFIX) &&
484 !(operators[o].flags & OP_SUFFIX) && /* remove this */
485 !strcmp(parser_tokval(parser), operators[o].op))
490 if (o == operator_count) {
491 /* no operator found... must be the end of the statement */
494 /* found an operator */
/* olast: operator currently on top of the stack, unless that is a parenthesis marker */
497 if (sy.ops_count && !sy.ops[sy.ops_count-1].paren)
498 olast = &operators[sy.ops[sy.ops_count-1].etype-1];
/* pop while the new operator has lower precedence, or equal precedence and is left-associative */
501 (op->prec < olast->prec) ||
502 (op->assoc == ASSOC_LEFT && op->prec <= olast->prec) ) )
504 if (!parser_sy_pop(parser, &sy))
506 if (sy.ops_count && !sy.ops[sy.ops_count-1].paren)
507 olast = &operators[sy.ops[sy.ops_count-1].etype-1];
510 if (!shunt_ops_add(&sy, syop(parser_ctx(parser), op)))
512 printf("Added op %s\n", op->op);
515 parser->lex->flags.noops = true;
517 if (!parser_next(parser)) {
520 if (parser->tok == ';') {
521 printf("End of statement\n");
525 if (!parser_next(parser)) {
526 parseerror(parser, "Unexpected end of file");
/* end of input for this expression: apply every operator that is still pending */
530 while (sy.ops_count) {
531 if (!parser_sy_pop(parser, &sy))
535 parser->lex->flags.noops = true;
537 parseerror(parser, "empty expression");
/* the bottom output element is taken as the resulting expression */
540 expr = sy.out[0].out;
541 MEM_VECTOR_CLEAR(&sy, out);
542 MEM_VECTOR_CLEAR(&sy, ops);
/* second exit (presumably the failure path): reset the lexer flag and release both stacks */
546 parser->lex->flags.noops = true;
547 MEM_VECTOR_CLEAR(&sy, out);
548 MEM_VECTOR_CLEAR(&sy, ops);
/* Forward declaration: parser_body_do calls parser_variable, which in turn
 * reaches parser_body_do again through parser_parse_block. */
552 static bool parser_variable(parser_t *parser, ast_block *localblock);
/* Parse one statement of a function body and append it to block.
 * - type name: a local variable declaration, handled by parser_variable
 * - keyword "return": the following expression is parsed and wrapped in a
 *   return node; any other keyword is reported as "Unexpected keyword"
 * - '{': inner blocks are not implemented yet and reported as an error
 * - otherwise: the statement is parsed as an expression */
553 static bool parser_body_do(parser_t *parser, ast_block *block)
555 if (parser->tok == TOKEN_TYPENAME)
558 if (!parser_variable(parser, block))
562 else if (parser->tok == TOKEN_KEYWORD)
564 if (!strcmp(parser_tokval(parser), "return"))
569 if (!parser_next(parser)) {
570 parseerror(parser, "expected return expression");
574 exp = parser_expression(parser);
/* the return node takes its source context from the returned expression */
577 ret = ast_return_new(exp->expression.node.context, exp);
582 if (!ast_block_exprs_add(block, (ast_expression*)ret)) {
588 parseerror(parser, "Unexpected keyword");
591 else if (parser->tok == '{')
594 parseerror(parser, "TODO: inner blocks: %s", parser_tokval(parser));
599 ast_expression *exp = parser_expression(parser);
602 if (!ast_block_exprs_add(block, exp)) {
/* Parse a brace-enclosed block; the current token is expected to be '{'.
 * parser->blocklocal is saved, set to the current number of locals for the
 * duration of the block and restored at the end. Statements are parsed with
 * parser_body_do() until '}' is reached; on a failing statement or a missing
 * '}' the block is deleted. */
610 static ast_block* parser_parse_block(parser_t *parser)
612 size_t oldblocklocal;
613 ast_block *block = NULL;
/* locals declared from here on belong to this block */
615 oldblocklocal = parser->blocklocal;
616 parser->blocklocal = parser->locals_count;
618 if (!parser_next(parser)) { /* skip the '{' */
619 parseerror(parser, "expected function body");
623 block = ast_block_new(parser_ctx(parser));
625 while (parser->tok != TOKEN_EOF && parser->tok < TOKEN_ERROR)
627 if (parser->tok == '}')
630 if (!parser_body_do(parser, block)) {
631 ast_block_delete(block);
/* the loop may also have ended on EOF or an error token instead of '}' */
637 if (parser->tok != '}') {
638 ast_block_delete(block);
/* step past the '}'; the result is deliberately ignored */
641 (void)parser_next(parser);
645 parser->blocklocal = oldblocklocal;
/* Parse a variable or function declaration; the current token is a type name.
 * localblock: block that receives the declaration as a local, or NULL for a
 *             global declaration (parser_do passes NULL, parser_body_do
 *             passes its block).
 * Visible steps:
 *  - read the base type from the current token and parse the full type
 *  - require an identifier; reject a name that already exists as a global,
 *    or as a local at or above parser->blocklocal
 *  - name the value; for functions create a TYPE_FUNCTION value and an
 *    ast_function, link the old value through expression.next, move the
 *    parameters over and register the function
 *  - add the value to parser->globals or parser->locals (and to the block's
 *    locals for local declarations)
 *  - then accept ';', ',' or '=': after '=' either '#' plus a positive
 *    integer constant (stored negated in func->builtin, only for global
 *    functions) or a '{' body parsed by parser_parse_block and added to the
 *    function; anything else reports "TODO, const assignment"
 * NOTE(review): after the value has been added to globals/locals, the failing
 * parser_next() path still calls ast_value_delete(var); the vector appears to
 * keep referencing it - confirm against the lines not shown here.
 * NOTE(review): several messages below end in "\n" while most parseerror()
 * calls in this file do not - confirm which form is intended. */
649 static bool parser_variable(parser_t *parser, ast_block *localblock)
652 ast_function *func = NULL;
656 int basetype = parser_token(parser)->constval.t;
660 if (!parser_next(parser)) { /* skip basetype or comma */
661 parseerror(parser, "expected variable declaration");
667 ctx = parser_ctx(parser);
668 var = parser_parse_type(parser, basetype, &isfunc);
673 if (parser->tok != TOKEN_IDENT) {
674 parseerror(parser, "expected variable name\n");
678 if (!localblock && parser_find_global(parser, parser_tokval(parser))) {
679 ast_value_delete(var);
680 parseerror(parser, "global already exists: %s\n", parser_tokval(parser));
684 if (localblock && parser_find_local(parser, parser_tokval(parser), parser->blocklocal)) {
685 ast_value_delete(var);
686 parseerror(parser, "local variable already exists: %s\n", parser_tokval(parser));
690 if (!ast_value_set_name(var, parser_tokval(parser))) {
691 parseerror(parser, "failed to set variable name\n");
692 ast_value_delete(var);
697 /* a function was defined */
700 /* turn var into a value of TYPE_FUNCTION, with the old var
703 fval = ast_value_new(ctx, var->name, TYPE_FUNCTION);
704 func = ast_function_new(ctx, var->name, fval);
705 if (!fval || !func) {
706 ast_value_delete(var);
707 if (fval) ast_value_delete(fval);
708 if (func) ast_function_delete(func);
712 fval->expression.next = (ast_expression*)var;
713 MEM_VECTOR_MOVE(var, params, fval, params);
715 if (!parser_t_functions_add(parser, func)) {
716 ast_value_delete(var);
717 if (fval) ast_value_delete(fval);
718 if (func) ast_function_delete(func);
725 if ( (!localblock && !parser_t_globals_add(parser, var)) ||
726 ( localblock && !parser_t_locals_add(parser, var)) )
728 ast_value_delete(var);
731 if (localblock && !ast_block_locals_add(localblock, var))
733 parser->locals_count--;
734 ast_value_delete(var);
738 if (!parser_next(parser)) {
739 ast_value_delete(var);
743 if (parser->tok == ';') {
744 if (!parser_next(parser))
745 return parser->tok == TOKEN_EOF;
749 if (parser->tok == ',') {
754 if (parser->tok != '=') {
755 parseerror(parser, "expected '=' or ';'");
759 if (!parser_next(parser))
762 if (parser->tok == '#') {
764 parseerror(parser, "cannot declare builtins within functions");
767 if (!isfunc || !func) {
768 parseerror(parser, "unexpected builtin number, '%s' is not a function", var->name);
771 if (!parser_next(parser)) {
772 parseerror(parser, "expected builtin number");
775 if (parser->tok != TOKEN_INTCONST) {
776 parseerror(parser, "builtin number must be an integer constant");
779 if (parser_token(parser)->constval.i <= 0) {
780 parseerror(parser, "builtin number must be positive integer greater than zero");
784 func->builtin = -parser_token(parser)->constval.i;
785 } else if (parser->tok == '{') {
788 ast_function *old = parser->function;
791 parseerror(parser, "cannot declare functions within functions");
795 parser->function = func;
796 block = parser_parse_block(parser);
797 parser->function = old;
802 if (!ast_function_blocks_add(func, block)) {
803 ast_block_delete(block);
808 parseerror(parser, "TODO, const assignment");
811 if (!parser_next(parser))
814 if (parser->tok == ',') {
819 if (parser->tok != ';') {
820 parseerror(parser, "expected semicolon");
824 (void)parser_next(parser);
/* Parse one top-level construct. A type name starts a global declaration
 * (parser_variable with a NULL block). Keywords and '.' have branches whose
 * bodies are not shown here. Any other token is reported as unexpected. */
830 static bool parser_do(parser_t *parser)
832 if (parser->tok == TOKEN_TYPENAME)
834 return parser_variable(parser, NULL);
836 else if (parser->tok == TOKEN_KEYWORD)
838 /* handle 'var' and 'const' */
841 else if (parser->tok == '.')
843 /* entity-member declaration */
848 parseerror(parser, "unexpected token: %s", parser->lex->tok->value);
/* Compile one source file.
 * filename: path handed to lex_open().
 * Visible steps: allocate and zero the parser state, open the lexer, parse
 * top-level constructs with parser_do() until EOF or an error token, close
 * the lexer, create the IR builder "gmqcc_out", generate code for the float
 * immediates, the globals and the functions (finalizing each function), dump
 * the IR through printf, and finally delete the global values.
 * The return statements are not part of this view. */
854 bool parser_compile(const char *filename)
860 parser = (parser_t*)mem_a(sizeof(parser_t));
/* zero the whole structure; sizeof(parser) would only cover the size of the pointer */
864 memset(parser, 0, sizeof(*parser));
866 MEM_VECTOR_INIT(parser, globals);
867 MEM_VECTOR_INIT(parser, locals);
868 parser->lex = lex_open(filename);
871 printf("failed to open file \"%s\"\n", filename);
875 /* initial lexer/parser state */
876 parser->lex->flags.noops = true;
878 if (parser_next(parser))
880 while (parser->tok != TOKEN_EOF && parser->tok < TOKEN_ERROR)
882 if (!parser_do(parser)) {
883 if (parser->tok == TOKEN_EOF)
884 parseerror(parser, "unexpected eof");
886 parseerror(parser, "parse error\n");
887 lex_close(parser->lex);
894 lex_close(parser->lex);
896 ir = ir_builder_new("gmqcc_out");
898 printf("failed to allocate builder\n");
/* code generation order: float immediates, then globals, then functions */
902 for (i = 0; i < parser->imm_float_count; ++i) {
903 if (!ast_global_codegen(parser->imm_float[i], ir)) {
904 printf("failed to generate global %s\n", parser->imm_float[i]->name);
907 for (i = 0; i < parser->globals_count; ++i) {
908 if (!ast_global_codegen(parser->globals[i], ir)) {
909 printf("failed to generate global %s\n", parser->globals[i]->name);
912 for (i = 0; i < parser->functions_count; ++i) {
913 if (!ast_function_codegen(parser->functions[i], ir)) {
914 printf("failed to generate function %s\n", parser->functions[i]->name);
916 if (!ir_function_finalize(parser->functions[i]->ir_func)) {
917 printf("failed to finalize function %s\n", parser->functions[i]->name);
921 ir_builder_dump(ir, printf);
/* release the global values and their vector */
924 for (i = 0; i < parser->globals_count; ++i) {
925 ast_value_delete(parser->globals[i]);
927 MEM_VECTOR_CLEAR(parser, globals);