5 * Permission is hereby granted, free of charge, to any person obtaining a copy of
6 * this software and associated documentation files (the "Software"), to deal in
7 * the Software without restriction, including without limitation the rights to
8 * use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
9 * of the Software, and to permit persons to whom the Software is furnished to do
10 * so, subject to the following conditions:
12 * The above copyright notice and this permission notice shall be included in all
13 * copies or substantial portions of the Software.
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
28 /***********************************************************************
29 * Type sizes used at multiple points in the IR codegen
32 const char *type_name[TYPE_COUNT] = {
50 size_t type_sizeof_[TYPE_COUNT] = {
57 1, /* TYPE_FUNCTION */
67 uint16_t type_store_instr[TYPE_COUNT] = {
68 INSTR_STORE_F, /* should use I when having integer support */
75 INSTR_STORE_ENT, /* should use I */
77 INSTR_STORE_I, /* integer type */
82 INSTR_STORE_V, /* variant, should never be accessed */
84 AINSTR_END, /* struct */
85 AINSTR_END, /* union */
86 AINSTR_END, /* array */
90 uint16_t field_store_instr[TYPE_COUNT] = {
100 INSTR_STORE_FLD, /* integer type */
105 INSTR_STORE_V, /* variant, should never be accessed */
107 AINSTR_END, /* struct */
108 AINSTR_END, /* union */
109 AINSTR_END, /* array */
110 AINSTR_END, /* nil */
113 uint16_t type_storep_instr[TYPE_COUNT] = {
114 INSTR_STOREP_F, /* should use I when having integer support */
121 INSTR_STOREP_ENT, /* should use I */
123 INSTR_STOREP_ENT, /* integer type */
128 INSTR_STOREP_V, /* variant, should never be accessed */
130 AINSTR_END, /* struct */
131 AINSTR_END, /* union */
132 AINSTR_END, /* array */
133 AINSTR_END, /* nil */
136 uint16_t type_eq_instr[TYPE_COUNT] = {
137 INSTR_EQ_F, /* should use I when having integer support */
142 INSTR_EQ_E, /* FLD has no comparison */
144 INSTR_EQ_E, /* should use I */
151 INSTR_EQ_V, /* variant, should never be accessed */
153 AINSTR_END, /* struct */
154 AINSTR_END, /* union */
155 AINSTR_END, /* array */
156 AINSTR_END, /* nil */
159 uint16_t type_ne_instr[TYPE_COUNT] = {
160 INSTR_NE_F, /* should use I when having integer support */
165 INSTR_NE_E, /* FLD has no comparison */
167 INSTR_NE_E, /* should use I */
174 INSTR_NE_V, /* variant, should never be accessed */
176 AINSTR_END, /* struct */
177 AINSTR_END, /* union */
178 AINSTR_END, /* array */
179 AINSTR_END, /* nil */
182 uint16_t type_not_instr[TYPE_COUNT] = {
183 INSTR_NOT_F, /* should use I when having integer support */
190 INSTR_NOT_ENT, /* should use I */
192 INSTR_NOT_I, /* integer type */
197 INSTR_NOT_V, /* variant, should never be accessed */
199 AINSTR_END, /* struct */
200 AINSTR_END, /* union */
201 AINSTR_END, /* array */
202 AINSTR_END, /* nil */
206 static ir_value* ir_gen_extparam_proto(ir_builder *ir);
207 static void ir_gen_extparam (ir_builder *ir);
209 /* error functions */
211 static void irerror(lex_ctx ctx, const char *msg, ...)
215 con_cvprintmsg((void*)&ctx, LVL_ERROR, "internal error", msg, ap);
219 static bool irwarning(lex_ctx ctx, int warntype, const char *fmt, ...)
224 r = vcompile_warning(ctx, warntype, fmt, ap);
229 /***********************************************************************
230 * Vector utility functions
233 bool GMQCC_WARN vec_ir_value_find(ir_value **vec, const ir_value *what, size_t *idx)
236 size_t len = vec_size(vec);
237 for (i = 0; i < len; ++i) {
238 if (vec[i] == what) {
246 bool GMQCC_WARN vec_ir_block_find(ir_block **vec, ir_block *what, size_t *idx)
249 size_t len = vec_size(vec);
250 for (i = 0; i < len; ++i) {
251 if (vec[i] == what) {
259 bool GMQCC_WARN vec_ir_instr_find(ir_instr **vec, ir_instr *what, size_t *idx)
262 size_t len = vec_size(vec);
263 for (i = 0; i < len; ++i) {
264 if (vec[i] == what) {
272 /***********************************************************************
276 static void ir_block_delete_quick(ir_block* self);
277 static void ir_instr_delete_quick(ir_instr *self);
278 static void ir_function_delete_quick(ir_function *self);
280 ir_builder* ir_builder_new(const char *modulename)
284 self = (ir_builder*)mem_a(sizeof(*self));
288 self->functions = NULL;
289 self->globals = NULL;
291 self->filenames = NULL;
292 self->filestrings = NULL;
293 self->htglobals = util_htnew(IR_HT_SIZE);
294 self->htfields = util_htnew(IR_HT_SIZE);
295 self->htfunctions = util_htnew(IR_HT_SIZE);
297 self->extparams = NULL;
298 self->extparam_protos = NULL;
300 self->first_common_globaltemp = 0;
301 self->max_globaltemps = 0;
302 self->first_common_local = 0;
303 self->max_locals = 0;
305 self->str_immediate = 0;
307 if (!ir_builder_set_name(self, modulename)) {
312 self->nil = ir_value_var("nil", store_value, TYPE_NIL);
313 self->nil->cvq = CV_CONST;
318 void ir_builder_delete(ir_builder* self)
321 util_htdel(self->htglobals);
322 util_htdel(self->htfields);
323 util_htdel(self->htfunctions);
324 mem_d((void*)self->name);
325 for (i = 0; i != vec_size(self->functions); ++i) {
326 ir_function_delete_quick(self->functions[i]);
328 vec_free(self->functions);
329 for (i = 0; i != vec_size(self->extparams); ++i) {
330 ir_value_delete(self->extparams[i]);
332 vec_free(self->extparams);
333 for (i = 0; i != vec_size(self->globals); ++i) {
334 ir_value_delete(self->globals[i]);
336 vec_free(self->globals);
337 for (i = 0; i != vec_size(self->fields); ++i) {
338 ir_value_delete(self->fields[i]);
340 ir_value_delete(self->nil);
341 vec_free(self->fields);
342 vec_free(self->filenames);
343 vec_free(self->filestrings);
347 bool ir_builder_set_name(ir_builder *self, const char *name)
350 mem_d((void*)self->name);
351 self->name = util_strdup(name);
355 ir_function* ir_builder_get_function(ir_builder *self, const char *name)
357 return (ir_function*)util_htget(self->htfunctions, name);
360 ir_function* ir_builder_create_function(ir_builder *self, const char *name, int outtype)
362 ir_function *fn = ir_builder_get_function(self, name);
367 fn = ir_function_new(self, outtype);
368 if (!ir_function_set_name(fn, name))
370 ir_function_delete(fn);
373 vec_push(self->functions, fn);
374 util_htset(self->htfunctions, name, fn);
376 fn->value = ir_builder_create_global(self, fn->name, TYPE_FUNCTION);
378 ir_function_delete(fn);
382 fn->value->hasvalue = true;
383 fn->value->outtype = outtype;
384 fn->value->constval.vfunc = fn;
385 fn->value->context = fn->context;
390 ir_value* ir_builder_get_global(ir_builder *self, const char *name)
392 return (ir_value*)util_htget(self->htglobals, name);
395 ir_value* ir_builder_create_global(ir_builder *self, const char *name, int vtype)
399 if (name && name[0] != '#')
401 ve = ir_builder_get_global(self, name);
407 ve = ir_value_var(name, store_global, vtype);
408 vec_push(self->globals, ve);
409 util_htset(self->htglobals, name, ve);
413 ir_value* ir_builder_get_field(ir_builder *self, const char *name)
415 return (ir_value*)util_htget(self->htfields, name);
419 ir_value* ir_builder_create_field(ir_builder *self, const char *name, int vtype)
421 ir_value *ve = ir_builder_get_field(self, name);
426 ve = ir_value_var(name, store_global, TYPE_FIELD);
427 ve->fieldtype = vtype;
428 vec_push(self->fields, ve);
429 util_htset(self->htfields, name, ve);
433 /***********************************************************************
437 bool ir_function_naive_phi(ir_function*);
438 void ir_function_enumerate(ir_function*);
439 bool ir_function_calculate_liferanges(ir_function*);
440 bool ir_function_allocate_locals(ir_function*);
442 ir_function* ir_function_new(ir_builder* owner, int outtype)
445 self = (ir_function*)mem_a(sizeof(*self));
450 memset(self, 0, sizeof(*self));
453 if (!ir_function_set_name(self, "<@unnamed>")) {
460 self->context.file = "<@no context>";
461 self->context.line = 0;
462 self->outtype = outtype;
471 self->code_function_def = -1;
472 self->allocated_locals = 0;
473 self->globaltemps = 0;
479 bool ir_function_set_name(ir_function *self, const char *name)
482 mem_d((void*)self->name);
483 self->name = util_strdup(name);
487 static void ir_function_delete_quick(ir_function *self)
490 mem_d((void*)self->name);
492 for (i = 0; i != vec_size(self->blocks); ++i)
493 ir_block_delete_quick(self->blocks[i]);
494 vec_free(self->blocks);
496 vec_free(self->params);
498 for (i = 0; i != vec_size(self->values); ++i)
499 ir_value_delete(self->values[i]);
500 vec_free(self->values);
502 for (i = 0; i != vec_size(self->locals); ++i)
503 ir_value_delete(self->locals[i]);
504 vec_free(self->locals);
506 /* self->value is deleted by the builder */
511 void ir_function_delete(ir_function *self)
514 mem_d((void*)self->name);
516 for (i = 0; i != vec_size(self->blocks); ++i)
517 ir_block_delete(self->blocks[i]);
518 vec_free(self->blocks);
520 vec_free(self->params);
522 for (i = 0; i != vec_size(self->values); ++i)
523 ir_value_delete(self->values[i]);
524 vec_free(self->values);
526 for (i = 0; i != vec_size(self->locals); ++i)
527 ir_value_delete(self->locals[i]);
528 vec_free(self->locals);
530 /* self->value is deleted by the builder */
535 void ir_function_collect_value(ir_function *self, ir_value *v)
537 vec_push(self->values, v);
540 ir_block* ir_function_create_block(lex_ctx ctx, ir_function *self, const char *label)
542 ir_block* bn = ir_block_new(self, label);
544 vec_push(self->blocks, bn);
548 static bool instr_is_operation(uint16_t op)
550 return ( (op >= INSTR_MUL_F && op <= INSTR_GT) ||
551 (op >= INSTR_LOAD_F && op <= INSTR_LOAD_FNC) ||
552 (op == INSTR_ADDRESS) ||
553 (op >= INSTR_NOT_F && op <= INSTR_NOT_FNC) ||
554 (op >= INSTR_AND && op <= INSTR_BITOR) ||
555 (op >= INSTR_CALL0 && op <= INSTR_CALL8) );
558 bool ir_function_pass_peephole(ir_function *self)
562 for (b = 0; b < vec_size(self->blocks); ++b) {
564 ir_block *block = self->blocks[b];
566 for (i = 0; i < vec_size(block->instr); ++i) {
568 inst = block->instr[i];
571 (inst->opcode >= INSTR_STORE_F &&
572 inst->opcode <= INSTR_STORE_FNC))
580 oper = block->instr[i-1];
581 if (!instr_is_operation(oper->opcode))
584 value = oper->_ops[0];
586 /* only do it for SSA values */
587 if (value->store != store_value)
590 /* don't optimize out the temp if it's used later again */
591 if (vec_size(value->reads) != 1)
594 /* The very next store must use this value */
595 if (value->reads[0] != store)
598 /* And of course the store must _read_ from it, so it's in
600 if (store->_ops[1] != value)
603 ++opts_optimizationcount[OPTIM_PEEPHOLE];
604 (void)!ir_instr_op(oper, 0, store->_ops[0], true);
606 vec_remove(block->instr, i, 1);
607 ir_instr_delete(store);
609 else if (inst->opcode == VINSTR_COND)
611 /* COND on a value resulting from a NOT could
612 * remove the NOT and swap its operands
619 value = inst->_ops[0];
621 if (value->store != store_value ||
622 vec_size(value->reads) != 1 ||
623 value->reads[0] != inst)
628 inot = value->writes[0];
629 if (inot->_ops[0] != value ||
630 inot->opcode < INSTR_NOT_F ||
631 inot->opcode > INSTR_NOT_FNC ||
632 inot->opcode == INSTR_NOT_V || /* can't do these */
633 inot->opcode == INSTR_NOT_S)
639 ++opts_optimizationcount[OPTIM_PEEPHOLE];
641 (void)!ir_instr_op(inst, 0, inot->_ops[1], false);
644 for (inotid = 0; inotid < vec_size(tmp->instr); ++inotid) {
645 if (tmp->instr[inotid] == inot)
648 if (inotid >= vec_size(tmp->instr)) {
649 compile_error(inst->context, "sanity-check failed: failed to find instruction to optimize out");
652 vec_remove(tmp->instr, inotid, 1);
653 ir_instr_delete(inot);
654 /* swap ontrue/onfalse */
656 inst->bops[0] = inst->bops[1];
667 bool ir_function_pass_tailrecursion(ir_function *self)
671 for (b = 0; b < vec_size(self->blocks); ++b) {
673 ir_instr *ret, *call, *store = NULL;
674 ir_block *block = self->blocks[b];
676 if (!block->final || vec_size(block->instr) < 2)
679 ret = block->instr[vec_size(block->instr)-1];
680 if (ret->opcode != INSTR_DONE && ret->opcode != INSTR_RETURN)
683 call = block->instr[vec_size(block->instr)-2];
684 if (call->opcode >= INSTR_STORE_F && call->opcode <= INSTR_STORE_FNC) {
685 /* account for the unoptimized
687 * STORE %return, %tmp
691 if (vec_size(block->instr) < 3)
695 call = block->instr[vec_size(block->instr)-3];
698 if (call->opcode < INSTR_CALL0 || call->opcode > INSTR_CALL8)
702 /* optimize out the STORE */
704 ret->_ops[0] == store->_ops[0] &&
705 store->_ops[1] == call->_ops[0])
707 ++opts_optimizationcount[OPTIM_PEEPHOLE];
708 call->_ops[0] = store->_ops[0];
709 vec_remove(block->instr, vec_size(block->instr) - 2, 1);
710 ir_instr_delete(store);
719 funcval = call->_ops[1];
722 if (funcval->vtype != TYPE_FUNCTION || funcval->constval.vfunc != self)
725 /* now we have a CALL and a RET, check if it's a tailcall */
726 if (ret->_ops[0] && call->_ops[0] != ret->_ops[0])
729 ++opts_optimizationcount[OPTIM_TAIL_RECURSION];
730 vec_shrinkby(block->instr, 2);
732 block->final = false; /* open it back up */
734 /* emite parameter-stores */
735 for (p = 0; p < vec_size(call->params); ++p) {
736 /* assert(call->params_count <= self->locals_count); */
737 if (!ir_block_create_store(block, call->context, self->locals[p], call->params[p])) {
738 irerror(call->context, "failed to create tailcall store instruction for parameter %i", (int)p);
742 if (!ir_block_create_jump(block, call->context, self->blocks[0])) {
743 irerror(call->context, "failed to create tailcall jump");
747 ir_instr_delete(call);
748 ir_instr_delete(ret);
754 bool ir_function_finalize(ir_function *self)
761 if (OPTS_OPTIMIZATION(OPTIM_PEEPHOLE)) {
762 if (!ir_function_pass_peephole(self)) {
763 irerror(self->context, "generic optimization pass broke something in `%s`", self->name);
768 if (OPTS_OPTIMIZATION(OPTIM_TAIL_RECURSION)) {
769 if (!ir_function_pass_tailrecursion(self)) {
770 irerror(self->context, "tail-recursion optimization pass broke something in `%s`", self->name);
775 if (!ir_function_naive_phi(self))
778 for (i = 0; i < vec_size(self->locals); ++i) {
779 ir_value *v = self->locals[i];
780 if (v->vtype == TYPE_VECTOR ||
781 (v->vtype == TYPE_FIELD && v->outtype == TYPE_VECTOR))
783 ir_value_vector_member(v, 0);
784 ir_value_vector_member(v, 1);
785 ir_value_vector_member(v, 2);
788 for (i = 0; i < vec_size(self->values); ++i) {
789 ir_value *v = self->values[i];
790 if (v->vtype == TYPE_VECTOR ||
791 (v->vtype == TYPE_FIELD && v->outtype == TYPE_VECTOR))
793 ir_value_vector_member(v, 0);
794 ir_value_vector_member(v, 1);
795 ir_value_vector_member(v, 2);
799 ir_function_enumerate(self);
801 if (!ir_function_calculate_liferanges(self))
803 if (!ir_function_allocate_locals(self))
808 ir_value* ir_function_create_local(ir_function *self, const char *name, int vtype, bool param)
813 vec_size(self->locals) &&
814 self->locals[vec_size(self->locals)-1]->store != store_param) {
815 irerror(self->context, "cannot add parameters after adding locals");
819 ve = ir_value_var(name, (param ? store_param : store_local), vtype);
822 vec_push(self->locals, ve);
826 /***********************************************************************
830 ir_block* ir_block_new(ir_function* owner, const char *name)
833 self = (ir_block*)mem_a(sizeof(*self));
837 memset(self, 0, sizeof(*self));
840 if (name && !ir_block_set_label(self, name)) {
845 self->context.file = "<@no context>";
846 self->context.line = 0;
850 self->entries = NULL;
854 self->is_return = false;
859 self->generated = false;
864 static void ir_block_delete_quick(ir_block* self)
867 if (self->label) mem_d(self->label);
868 for (i = 0; i != vec_size(self->instr); ++i)
869 ir_instr_delete_quick(self->instr[i]);
870 vec_free(self->instr);
871 vec_free(self->entries);
872 vec_free(self->exits);
873 vec_free(self->living);
877 void ir_block_delete(ir_block* self)
880 if (self->label) mem_d(self->label);
881 for (i = 0; i != vec_size(self->instr); ++i)
882 ir_instr_delete(self->instr[i]);
883 vec_free(self->instr);
884 vec_free(self->entries);
885 vec_free(self->exits);
886 vec_free(self->living);
890 bool ir_block_set_label(ir_block *self, const char *name)
893 mem_d((void*)self->label);
894 self->label = util_strdup(name);
895 return !!self->label;
898 /***********************************************************************
902 ir_instr* ir_instr_new(lex_ctx ctx, ir_block* owner, int op)
905 self = (ir_instr*)mem_a(sizeof(*self));
912 self->_ops[0] = NULL;
913 self->_ops[1] = NULL;
914 self->_ops[2] = NULL;
915 self->bops[0] = NULL;
916 self->bops[1] = NULL;
927 static void ir_instr_delete_quick(ir_instr *self)
930 vec_free(self->params);
934 void ir_instr_delete(ir_instr *self)
937 /* The following calls can only delete from
938 * vectors, we still want to delete this instruction
939 * so ignore the return value. Since with the warn_unused_result attribute
940 * gcc doesn't care about an explicit: (void)foo(); to ignore the result,
941 * I have to improvise here and use if(foo());
943 for (i = 0; i < vec_size(self->phi); ++i) {
945 if (vec_ir_instr_find(self->phi[i].value->writes, self, &idx))
946 vec_remove(self->phi[i].value->writes, idx, 1);
947 if (vec_ir_instr_find(self->phi[i].value->reads, self, &idx))
948 vec_remove(self->phi[i].value->reads, idx, 1);
951 for (i = 0; i < vec_size(self->params); ++i) {
953 if (vec_ir_instr_find(self->params[i]->writes, self, &idx))
954 vec_remove(self->params[i]->writes, idx, 1);
955 if (vec_ir_instr_find(self->params[i]->reads, self, &idx))
956 vec_remove(self->params[i]->reads, idx, 1);
958 vec_free(self->params);
959 (void)!ir_instr_op(self, 0, NULL, false);
960 (void)!ir_instr_op(self, 1, NULL, false);
961 (void)!ir_instr_op(self, 2, NULL, false);
965 bool ir_instr_op(ir_instr *self, int op, ir_value *v, bool writing)
967 if (self->_ops[op]) {
969 if (writing && vec_ir_instr_find(self->_ops[op]->writes, self, &idx))
970 vec_remove(self->_ops[op]->writes, idx, 1);
971 else if (vec_ir_instr_find(self->_ops[op]->reads, self, &idx))
972 vec_remove(self->_ops[op]->reads, idx, 1);
976 vec_push(v->writes, self);
978 vec_push(v->reads, self);
984 /***********************************************************************
988 void ir_value_code_setaddr(ir_value *self, int32_t gaddr)
990 self->code.globaladdr = gaddr;
991 if (self->members[0]) self->members[0]->code.globaladdr = gaddr;
992 if (self->members[1]) self->members[1]->code.globaladdr = gaddr;
993 if (self->members[2]) self->members[2]->code.globaladdr = gaddr;
996 int32_t ir_value_code_addr(const ir_value *self)
998 if (self->store == store_return)
999 return OFS_RETURN + self->code.addroffset;
1000 return self->code.globaladdr + self->code.addroffset;
1003 ir_value* ir_value_var(const char *name, int storetype, int vtype)
1006 self = (ir_value*)mem_a(sizeof(*self));
1007 self->vtype = vtype;
1008 self->fieldtype = TYPE_VOID;
1009 self->outtype = TYPE_VOID;
1010 self->store = storetype;
1013 self->writes = NULL;
1015 self->cvq = CV_NONE;
1016 self->hasvalue = false;
1017 self->context.file = "<@no context>";
1018 self->context.line = 0;
1020 if (name && !ir_value_set_name(self, name)) {
1021 irerror(self->context, "out of memory");
1026 memset(&self->constval, 0, sizeof(self->constval));
1027 memset(&self->code, 0, sizeof(self->code));
1029 self->members[0] = NULL;
1030 self->members[1] = NULL;
1031 self->members[2] = NULL;
1032 self->memberof = NULL;
1034 self->unique_life = false;
1035 self->locked = false;
1036 self->callparam = false;
1042 ir_value* ir_value_vector_member(ir_value *self, unsigned int member)
1050 if (self->members[member])
1051 return self->members[member];
1054 len = strlen(self->name);
1055 name = (char*)mem_a(len + 3);
1056 memcpy(name, self->name, len);
1058 name[len+1] = 'x' + member;
1064 if (self->vtype == TYPE_VECTOR)
1066 m = ir_value_var(name, self->store, TYPE_FLOAT);
1071 m->context = self->context;
1073 self->members[member] = m;
1074 m->code.addroffset = member;
1076 else if (self->vtype == TYPE_FIELD)
1078 if (self->fieldtype != TYPE_VECTOR)
1080 m = ir_value_var(name, self->store, TYPE_FIELD);
1085 m->fieldtype = TYPE_FLOAT;
1086 m->context = self->context;
1088 self->members[member] = m;
1089 m->code.addroffset = member;
1093 irerror(self->context, "invalid member access on %s", self->name);
1101 static GMQCC_INLINE size_t ir_value_sizeof(const ir_value *self)
1103 if (self->vtype == TYPE_FIELD && self->fieldtype == TYPE_VECTOR)
1104 return type_sizeof_[TYPE_VECTOR];
1105 return type_sizeof_[self->vtype];
1108 ir_value* ir_value_out(ir_function *owner, const char *name, int storetype, int vtype)
1110 ir_value *v = ir_value_var(name, storetype, vtype);
1113 ir_function_collect_value(owner, v);
1117 void ir_value_delete(ir_value* self)
1121 mem_d((void*)self->name);
1124 if (self->vtype == TYPE_STRING)
1125 mem_d((void*)self->constval.vstring);
1127 for (i = 0; i < 3; ++i) {
1128 if (self->members[i])
1129 ir_value_delete(self->members[i]);
1131 vec_free(self->reads);
1132 vec_free(self->writes);
1133 vec_free(self->life);
1137 bool ir_value_set_name(ir_value *self, const char *name)
1140 mem_d((void*)self->name);
1141 self->name = util_strdup(name);
1142 return !!self->name;
1145 bool ir_value_set_float(ir_value *self, float f)
1147 if (self->vtype != TYPE_FLOAT)
1149 self->constval.vfloat = f;
1150 self->hasvalue = true;
1154 bool ir_value_set_func(ir_value *self, int f)
1156 if (self->vtype != TYPE_FUNCTION)
1158 self->constval.vint = f;
1159 self->hasvalue = true;
1163 bool ir_value_set_vector(ir_value *self, vector v)
1165 if (self->vtype != TYPE_VECTOR)
1167 self->constval.vvec = v;
1168 self->hasvalue = true;
1172 bool ir_value_set_field(ir_value *self, ir_value *fld)
1174 if (self->vtype != TYPE_FIELD)
1176 self->constval.vpointer = fld;
1177 self->hasvalue = true;
1181 static char *ir_strdup(const char *str)
1184 /* actually dup empty strings */
1185 char *out = (char*)mem_a(1);
1189 return util_strdup(str);
1192 bool ir_value_set_string(ir_value *self, const char *str)
1194 if (self->vtype != TYPE_STRING)
1196 self->constval.vstring = ir_strdup(str);
1197 self->hasvalue = true;
1202 bool ir_value_set_int(ir_value *self, int i)
1204 if (self->vtype != TYPE_INTEGER)
1206 self->constval.vint = i;
1207 self->hasvalue = true;
1212 bool ir_value_lives(ir_value *self, size_t at)
1215 for (i = 0; i < vec_size(self->life); ++i)
1217 ir_life_entry_t *life = &self->life[i];
1218 if (life->start <= at && at <= life->end)
1220 if (life->start > at) /* since it's ordered */
1226 bool ir_value_life_insert(ir_value *self, size_t idx, ir_life_entry_t e)
1229 vec_push(self->life, e);
1230 for (k = vec_size(self->life)-1; k > idx; --k)
1231 self->life[k] = self->life[k-1];
1232 self->life[idx] = e;
1236 bool ir_value_life_merge(ir_value *self, size_t s)
1239 ir_life_entry_t *life = NULL;
1240 ir_life_entry_t *before = NULL;
1241 ir_life_entry_t new_entry;
1243 /* Find the first range >= s */
1244 for (i = 0; i < vec_size(self->life); ++i)
1247 life = &self->life[i];
1248 if (life->start > s)
1251 /* nothing found? append */
1252 if (i == vec_size(self->life)) {
1254 if (life && life->end+1 == s)
1256 /* previous life range can be merged in */
1260 if (life && life->end >= s)
1262 e.start = e.end = s;
1263 vec_push(self->life, e);
1269 if (before->end + 1 == s &&
1270 life->start - 1 == s)
1273 before->end = life->end;
1274 vec_remove(self->life, i, 1);
1277 if (before->end + 1 == s)
1283 /* already contained */
1284 if (before->end >= s)
1288 if (life->start - 1 == s)
1293 /* insert a new entry */
1294 new_entry.start = new_entry.end = s;
1295 return ir_value_life_insert(self, i, new_entry);
1298 bool ir_value_life_merge_into(ir_value *self, const ir_value *other)
1302 if (!vec_size(other->life))
1305 if (!vec_size(self->life)) {
1306 size_t count = vec_size(other->life);
1307 ir_life_entry_t *life = vec_add(self->life, count);
1308 memcpy(life, other->life, count * sizeof(*life));
1313 for (i = 0; i < vec_size(other->life); ++i)
1315 const ir_life_entry_t *life = &other->life[i];
1318 ir_life_entry_t *entry = &self->life[myi];
1320 if (life->end+1 < entry->start)
1322 /* adding an interval before entry */
1323 if (!ir_value_life_insert(self, myi, *life))
1329 if (life->start < entry->start &&
1330 life->end+1 >= entry->start)
1332 /* starts earlier and overlaps */
1333 entry->start = life->start;
1336 if (life->end > entry->end &&
1337 life->start <= entry->end+1)
1339 /* ends later and overlaps */
1340 entry->end = life->end;
1343 /* see if our change combines it with the next ranges */
1344 while (myi+1 < vec_size(self->life) &&
1345 entry->end+1 >= self->life[1+myi].start)
1347 /* overlaps with (myi+1) */
1348 if (entry->end < self->life[1+myi].end)
1349 entry->end = self->life[1+myi].end;
1350 vec_remove(self->life, myi+1, 1);
1351 entry = &self->life[myi];
1354 /* see if we're after the entry */
1355 if (life->start > entry->end)
1358 /* append if we're at the end */
1359 if (myi >= vec_size(self->life)) {
1360 vec_push(self->life, *life);
1363 /* otherweise check the next range */
1372 bool ir_values_overlap(const ir_value *a, const ir_value *b)
1374 /* For any life entry in A see if it overlaps with
1375 * any life entry in B.
1376 * Note that the life entries are orderes, so we can make a
1377 * more efficient algorithm there than naively translating the
1381 ir_life_entry_t *la, *lb, *enda, *endb;
1383 /* first of all, if either has no life range, they cannot clash */
1384 if (!vec_size(a->life) || !vec_size(b->life))
1389 enda = la + vec_size(a->life);
1390 endb = lb + vec_size(b->life);
1393 /* check if the entries overlap, for that,
1394 * both must start before the other one ends.
1396 if (la->start < lb->end &&
1397 lb->start < la->end)
1402 /* entries are ordered
1403 * one entry is earlier than the other
1404 * that earlier entry will be moved forward
1406 if (la->start < lb->start)
1408 /* order: A B, move A forward
1409 * check if we hit the end with A
1414 else /* if (lb->start < la->start) actually <= */
1416 /* order: B A, move B forward
1417 * check if we hit the end with B
1426 /***********************************************************************
1430 static bool ir_check_unreachable(ir_block *self)
1432 /* The IR should never have to deal with unreachable code */
1433 if (!self->final/* || OPTS_FLAG(ALLOW_UNREACHABLE_CODE)*/)
1435 irerror(self->context, "unreachable statement (%s)", self->label);
1439 bool ir_block_create_store_op(ir_block *self, lex_ctx ctx, int op, ir_value *target, ir_value *what)
1442 if (!ir_check_unreachable(self))
1445 if (target->store == store_value &&
1446 (op < INSTR_STOREP_F || op > INSTR_STOREP_FNC))
1448 irerror(self->context, "cannot store to an SSA value");
1449 irerror(self->context, "trying to store: %s <- %s", target->name, what->name);
1450 irerror(self->context, "instruction: %s", asm_instr[op].m);
1454 in = ir_instr_new(ctx, self, op);
1458 if (!ir_instr_op(in, 0, target, (op < INSTR_STOREP_F || op > INSTR_STOREP_FNC)) ||
1459 !ir_instr_op(in, 1, what, false))
1461 ir_instr_delete(in);
1464 vec_push(self->instr, in);
1468 bool ir_block_create_store(ir_block *self, lex_ctx ctx, ir_value *target, ir_value *what)
1472 if (target->vtype == TYPE_VARIANT)
1473 vtype = what->vtype;
1475 vtype = target->vtype;
1478 if (vtype == TYPE_FLOAT && what->vtype == TYPE_INTEGER)
1479 op = INSTR_CONV_ITOF;
1480 else if (vtype == TYPE_INTEGER && what->vtype == TYPE_FLOAT)
1481 op = INSTR_CONV_FTOI;
1483 op = type_store_instr[vtype];
1485 if (OPTS_FLAG(ADJUST_VECTOR_FIELDS)) {
1486 if (op == INSTR_STORE_FLD && what->fieldtype == TYPE_VECTOR)
1490 return ir_block_create_store_op(self, ctx, op, target, what);
1493 bool ir_block_create_storep(ir_block *self, lex_ctx ctx, ir_value *target, ir_value *what)
1498 if (target->vtype != TYPE_POINTER)
1501 /* storing using pointer - target is a pointer, type must be
1502 * inferred from source
1504 vtype = what->vtype;
1506 op = type_storep_instr[vtype];
1507 if (OPTS_FLAG(ADJUST_VECTOR_FIELDS)) {
1508 if (op == INSTR_STOREP_FLD && what->fieldtype == TYPE_VECTOR)
1509 op = INSTR_STOREP_V;
1512 return ir_block_create_store_op(self, ctx, op, target, what);
1515 bool ir_block_create_return(ir_block *self, lex_ctx ctx, ir_value *v)
1518 if (!ir_check_unreachable(self))
1521 self->is_return = true;
1522 in = ir_instr_new(ctx, self, INSTR_RETURN);
1526 if (v && !ir_instr_op(in, 0, v, false)) {
1527 ir_instr_delete(in);
1531 vec_push(self->instr, in);
1535 bool ir_block_create_if(ir_block *self, lex_ctx ctx, ir_value *v,
1536 ir_block *ontrue, ir_block *onfalse)
1539 if (!ir_check_unreachable(self))
1542 /*in = ir_instr_new(ctx, self, (v->vtype == TYPE_STRING ? INSTR_IF_S : INSTR_IF_F));*/
1543 in = ir_instr_new(ctx, self, VINSTR_COND);
1547 if (!ir_instr_op(in, 0, v, false)) {
1548 ir_instr_delete(in);
1552 in->bops[0] = ontrue;
1553 in->bops[1] = onfalse;
1555 vec_push(self->instr, in);
1557 vec_push(self->exits, ontrue);
1558 vec_push(self->exits, onfalse);
1559 vec_push(ontrue->entries, self);
1560 vec_push(onfalse->entries, self);
1564 bool ir_block_create_jump(ir_block *self, lex_ctx ctx, ir_block *to)
1567 if (!ir_check_unreachable(self))
1570 in = ir_instr_new(ctx, self, VINSTR_JUMP);
1575 vec_push(self->instr, in);
1577 vec_push(self->exits, to);
1578 vec_push(to->entries, self);
1582 bool ir_block_create_goto(ir_block *self, lex_ctx ctx, ir_block *to)
1584 self->owner->flags |= IR_FLAG_HAS_GOTO;
1585 return ir_block_create_jump(self, ctx, to);
1588 ir_instr* ir_block_create_phi(ir_block *self, lex_ctx ctx, const char *label, int ot)
1592 if (!ir_check_unreachable(self))
1594 in = ir_instr_new(ctx, self, VINSTR_PHI);
1597 out = ir_value_out(self->owner, label, store_value, ot);
1599 ir_instr_delete(in);
1602 if (!ir_instr_op(in, 0, out, true)) {
1603 ir_instr_delete(in);
1604 ir_value_delete(out);
1607 vec_push(self->instr, in);
1611 ir_value* ir_phi_value(ir_instr *self)
1613 return self->_ops[0];
1616 void ir_phi_add(ir_instr* self, ir_block *b, ir_value *v)
1620 if (!vec_ir_block_find(self->owner->entries, b, NULL)) {
1621 /* Must not be possible to cause this, otherwise the AST
1622 * is doing something wrong.
1624 irerror(self->context, "Invalid entry block for PHI");
1630 vec_push(v->reads, self);
1631 vec_push(self->phi, pe);
1634 /* call related code */
1635 ir_instr* ir_block_create_call(ir_block *self, lex_ctx ctx, const char *label, ir_value *func, bool noreturn)
1639 if (!ir_check_unreachable(self))
1641 in = ir_instr_new(ctx, self, (noreturn ? VINSTR_NRCALL : INSTR_CALL0));
1646 self->is_return = true;
1648 out = ir_value_out(self->owner, label, (func->outtype == TYPE_VOID) ? store_return : store_value, func->outtype);
1650 ir_instr_delete(in);
1653 if (!ir_instr_op(in, 0, out, true) ||
1654 !ir_instr_op(in, 1, func, false))
1656 ir_instr_delete(in);
1657 ir_value_delete(out);
1660 vec_push(self->instr, in);
1663 if (!ir_block_create_return(self, ctx, NULL)) {
1664 compile_error(ctx, "internal error: failed to generate dummy-return instruction");
1665 ir_instr_delete(in);
1673 ir_value* ir_call_value(ir_instr *self)
1675 return self->_ops[0];
1678 void ir_call_param(ir_instr* self, ir_value *v)
1680 vec_push(self->params, v);
1681 vec_push(v->reads, self);
1684 /* binary op related code */
1686 ir_value* ir_block_create_binop(ir_block *self, lex_ctx ctx,
1687 const char *label, int opcode,
1688 ir_value *left, ir_value *right)
1710 case INSTR_SUB_S: /* -- offset of string as float */
1715 case INSTR_BITOR_IF:
1716 case INSTR_BITOR_FI:
1717 case INSTR_BITAND_FI:
1718 case INSTR_BITAND_IF:
1733 case INSTR_BITAND_I:
1736 case INSTR_RSHIFT_I:
1737 case INSTR_LSHIFT_I:
1759 /* boolean operations result in floats */
1760 if (opcode >= INSTR_EQ_F && opcode <= INSTR_GT)
1762 else if (opcode >= INSTR_LE && opcode <= INSTR_GT)
1765 else if (opcode >= INSTR_LE_I && opcode <= INSTR_EQ_FI)
1770 if (ot == TYPE_VOID) {
1771 /* The AST or parser were supposed to check this! */
1775 return ir_block_create_general_instr(self, ctx, label, opcode, left, right, ot);
1778 ir_value* ir_block_create_unary(ir_block *self, lex_ctx ctx,
1779 const char *label, int opcode,
1782 int ot = TYPE_FLOAT;
1794 /* QC doesn't have other unary operations. We expect extensions to fill
1795 * the above list, otherwise we assume out-type = in-type, eg for an
1799 ot = operand->vtype;
1802 if (ot == TYPE_VOID) {
1803 /* The AST or parser were supposed to check this! */
1807 /* let's use the general instruction creator and pass NULL for OPB */
1808 return ir_block_create_general_instr(self, ctx, label, opcode, operand, NULL, ot);
1811 ir_value* ir_block_create_general_instr(ir_block *self, lex_ctx ctx, const char *label,
1812 int op, ir_value *a, ir_value *b, int outype)
1817 out = ir_value_out(self->owner, label, store_value, outype);
1821 instr = ir_instr_new(ctx, self, op);
1823 ir_value_delete(out);
1827 if (!ir_instr_op(instr, 0, out, true) ||
1828 !ir_instr_op(instr, 1, a, false) ||
1829 !ir_instr_op(instr, 2, b, false) )
1834 vec_push(self->instr, instr);
1838 ir_instr_delete(instr);
1839 ir_value_delete(out);
1843 ir_value* ir_block_create_fieldaddress(ir_block *self, lex_ctx ctx, const char *label, ir_value *ent, ir_value *field)
1847 /* Support for various pointer types todo if so desired */
1848 if (ent->vtype != TYPE_ENTITY)
1851 if (field->vtype != TYPE_FIELD)
1854 v = ir_block_create_general_instr(self, ctx, label, INSTR_ADDRESS, ent, field, TYPE_POINTER);
1855 v->fieldtype = field->fieldtype;
1859 ir_value* ir_block_create_load_from_ent(ir_block *self, lex_ctx ctx, const char *label, ir_value *ent, ir_value *field, int outype)
1862 if (ent->vtype != TYPE_ENTITY)
1865 /* at some point we could redirect for TYPE_POINTER... but that could lead to carelessness */
1866 if (field->vtype != TYPE_FIELD)
1871 case TYPE_FLOAT: op = INSTR_LOAD_F; break;
1872 case TYPE_VECTOR: op = INSTR_LOAD_V; break;
1873 case TYPE_STRING: op = INSTR_LOAD_S; break;
1874 case TYPE_FIELD: op = INSTR_LOAD_FLD; break;
1875 case TYPE_ENTITY: op = INSTR_LOAD_ENT; break;
1876 case TYPE_FUNCTION: op = INSTR_LOAD_FNC; break;
1878 case TYPE_POINTER: op = INSTR_LOAD_I; break;
1879 case TYPE_INTEGER: op = INSTR_LOAD_I; break;
1882 irerror(self->context, "invalid type for ir_block_create_load_from_ent: %s", type_name[outype]);
1886 return ir_block_create_general_instr(self, ctx, label, op, ent, field, outype);
1889 /* PHI resolving breaks the SSA, and must thus be the last
1890 * step before life-range calculation.
1893 static bool ir_block_naive_phi(ir_block *self);
1894 bool ir_function_naive_phi(ir_function *self)
1898 for (i = 0; i < vec_size(self->blocks); ++i)
1900 if (!ir_block_naive_phi(self->blocks[i]))
1907 static bool ir_naive_phi_emit_store(ir_block *block, size_t iid, ir_value *old, ir_value *what)
1912 /* create a store */
1913 if (!ir_block_create_store(block, old, what))
1916 /* we now move it up */
1917 instr = vec_last(block->instr);
1918 for (i = vec_size(block->instr)-1; i > iid; --i)
1919 block->instr[i] = block->instr[i-1];
1920 block->instr[i] = instr;
1926 static bool ir_block_naive_phi(ir_block *self)
1928 size_t i, p; /*, w;*/
1929 /* FIXME: optionally, create_phi can add the phis
1930 * to a list so we don't need to loop through blocks
1931 * - anyway: "don't optimize YET"
1933 for (i = 0; i < vec_size(self->instr); ++i)
1935 ir_instr *instr = self->instr[i];
1936 if (instr->opcode != VINSTR_PHI)
1939 vec_remove(self->instr, i, 1);
1940 --i; /* NOTE: i+1 below */
1942 for (p = 0; p < vec_size(instr->phi); ++p)
1944 ir_value *v = instr->phi[p].value;
1945 ir_block *b = instr->phi[p].from;
1947 if (v->store == store_value &&
1948 vec_size(v->reads) == 1 &&
1949 vec_size(v->writes) == 1)
1951 /* replace the value */
1952 if (!ir_instr_op(v->writes[0], 0, instr->_ops[0], true))
1957 /* force a move instruction */
1958 ir_instr *prevjump = vec_last(b->instr);
1961 instr->_ops[0]->store = store_global;
1962 if (!ir_block_create_store(b, instr->context, instr->_ops[0], v))
1964 instr->_ops[0]->store = store_value;
1965 vec_push(b->instr, prevjump);
1970 ir_value *v = instr->phi[p].value;
1971 for (w = 0; w < vec_size(v->writes); ++w) {
1974 if (!v->writes[w]->_ops[0])
1977 /* When the write was to a global, we have to emit a mov */
1978 old = v->writes[w]->_ops[0];
1980 /* The original instruction now writes to the PHI target local */
1981 if (v->writes[w]->_ops[0] == v)
1982 v->writes[w]->_ops[0] = instr->_ops[0];
1984 if (old->store != store_value && old->store != store_local && old->store != store_param)
1986 /* If it originally wrote to a global we need to store the value
1989 if (!ir_naive_phi_emit_store(self, i+1, old, v))
1991 if (i+1 < vec_size(self->instr))
1992 instr = self->instr[i+1];
1995 /* In case I forget and access instr later, it'll be NULL
1996 * when it's a problem, to make sure we crash, rather than accessing
2002 /* If it didn't, we can replace all reads by the phi target now. */
2004 for (r = 0; r < vec_size(old->reads); ++r)
2007 ir_instr *ri = old->reads[r];
2008 for (op = 0; op < vec_size(ri->phi); ++op) {
2009 if (ri->phi[op].value == old)
2010 ri->phi[op].value = v;
2012 for (op = 0; op < 3; ++op) {
2013 if (ri->_ops[op] == old)
2021 ir_instr_delete(instr);
2026 /***********************************************************************
2027 *IR Temp allocation code
2028 * Propagating value life ranges by walking through the function backwards
2029 * until no more changes are made.
2030 * In theory this should happen once more than once for every nested loop
2032 * Though this implementation might run an additional time for if nests.
2035 /* Enumerate instructions used by value's life-ranges
2037 static void ir_block_enumerate(ir_block *self, size_t *_eid)
2041 for (i = 0; i < vec_size(self->instr); ++i)
2043 self->instr[i]->eid = eid++;
2048 /* Enumerate blocks and instructions.
2049 * The block-enumeration is unordered!
2050 * We do not really use the block enumreation, however
2051 * the instruction enumeration is important for life-ranges.
2053 void ir_function_enumerate(ir_function *self)
2056 size_t instruction_id = 1;
2057 for (i = 0; i < vec_size(self->blocks); ++i)
2059 self->blocks[i]->eid = i;
2060 self->blocks[i]->run_id = 0;
2061 ir_block_enumerate(self->blocks[i], &instruction_id);
2065 static bool ir_block_life_propagate(ir_block *b, ir_block *prev, bool *changed);
2066 bool ir_function_calculate_liferanges(ir_function *self)
2071 /* parameters live at 0 */
2072 for (i = 0; i < vec_size(self->params); ++i)
2073 ir_value_life_merge(self->locals[i], 0);
2078 for (i = 0; i != vec_size(self->blocks); ++i)
2080 if (self->blocks[i]->is_return)
2082 vec_free(self->blocks[i]->living);
2083 if (!ir_block_life_propagate(self->blocks[i], NULL, &changed))
2088 if (vec_size(self->blocks)) {
2089 ir_block *block = self->blocks[0];
2090 for (i = 0; i < vec_size(block->living); ++i) {
2091 ir_value *v = block->living[i];
2092 if (v->store != store_local)
2094 if (v->vtype == TYPE_VECTOR)
2096 self->flags |= IR_FLAG_HAS_UNINITIALIZED;
2097 /* find the instruction reading from it */
2098 for (s = 0; s < vec_size(v->reads); ++s) {
2099 if (v->reads[s]->eid == v->life[0].end)
2102 if (s < vec_size(v->reads)) {
2103 if (irwarning(v->context, WARN_USED_UNINITIALIZED,
2104 "variable `%s` may be used uninitialized in this function\n"
2107 v->reads[s]->context.file, v->reads[s]->context.line)
2115 ir_value *vec = v->memberof;
2116 for (s = 0; s < vec_size(vec->reads); ++s) {
2117 if (vec->reads[s]->eid == v->life[0].end)
2120 if (s < vec_size(vec->reads)) {
2121 if (irwarning(v->context, WARN_USED_UNINITIALIZED,
2122 "variable `%s` may be used uninitialized in this function\n"
2125 vec->reads[s]->context.file, vec->reads[s]->context.line)
2133 if (irwarning(v->context, WARN_USED_UNINITIALIZED,
2134 "variable `%s` may be used uninitialized in this function", v->name))
2143 /* Local-value allocator
2144 * After finishing creating the liferange of all values used in a function
2145 * we can allocate their global-positions.
2146 * This is the counterpart to register-allocation in register machines.
2153 } function_allocator;
2155 static bool function_allocator_alloc(function_allocator *alloc, ir_value *var)
2158 size_t vsize = ir_value_sizeof(var);
2160 var->code.local = vec_size(alloc->locals);
2162 slot = ir_value_var("reg", store_global, var->vtype);
2166 if (!ir_value_life_merge_into(slot, var))
2169 vec_push(alloc->locals, slot);
2170 vec_push(alloc->sizes, vsize);
2171 vec_push(alloc->unique, var->unique_life);
2176 ir_value_delete(slot);
2180 static bool ir_function_allocator_assign(ir_function *self, function_allocator *alloc, ir_value *v)
2185 for (a = 0; a < vec_size(alloc->locals); ++a)
2187 /* if it's reserved for a unique liferange: skip */
2188 if (alloc->unique[a])
2191 slot = alloc->locals[a];
2193 /* never resize parameters
2194 * will be required later when overlapping temps + locals
2196 if (a < vec_size(self->params) &&
2197 alloc->sizes[a] < ir_value_sizeof(v))
2202 if (ir_values_overlap(v, slot))
2205 if (!ir_value_life_merge_into(slot, v))
2208 /* adjust size for this slot */
2209 if (alloc->sizes[a] < ir_value_sizeof(v))
2210 alloc->sizes[a] = ir_value_sizeof(v);
2215 if (a >= vec_size(alloc->locals)) {
2216 if (!function_allocator_alloc(alloc, v))
2222 bool ir_function_allocate_locals(ir_function *self)
2227 bool opt_gt = OPTS_OPTIMIZATION(OPTIM_GLOBAL_TEMPS);
2231 function_allocator lockalloc, globalloc;
2233 if (!vec_size(self->locals) && !vec_size(self->values))
2236 globalloc.locals = NULL;
2237 globalloc.sizes = NULL;
2238 globalloc.positions = NULL;
2239 globalloc.unique = NULL;
2240 lockalloc.locals = NULL;
2241 lockalloc.sizes = NULL;
2242 lockalloc.positions = NULL;
2243 lockalloc.unique = NULL;
2245 for (i = 0; i < vec_size(self->locals); ++i)
2247 v = self->locals[i];
2248 if (!OPTS_OPTIMIZATION(OPTIM_LOCAL_TEMPS)) {
2250 v->unique_life = true;
2252 else if (i >= vec_size(self->params))
2255 v->locked = true; /* lock parameters locals */
2256 if (!function_allocator_alloc((v->locked || !opt_gt ? &lockalloc : &globalloc), self->locals[i]))
2259 for (; i < vec_size(self->locals); ++i)
2261 v = self->locals[i];
2262 if (!vec_size(v->life))
2264 if (!ir_function_allocator_assign(self, (v->locked || !opt_gt ? &lockalloc : &globalloc), v))
2268 /* Allocate a slot for any value that still exists */
2269 for (i = 0; i < vec_size(self->values); ++i)
2271 v = self->values[i];
2273 if (!vec_size(v->life))
2276 /* CALL optimization:
2277 * If the value is a parameter-temp: 1 write, 1 read from a CALL
2278 * and it's not "locked", write it to the OFS_PARM directly.
2280 if (OPTS_OPTIMIZATION(OPTIM_CALL_STORES) && !v->locked && !v->unique_life) {
2281 if (vec_size(v->reads) == 1 && vec_size(v->writes) == 1 &&
2282 (v->reads[0]->opcode == VINSTR_NRCALL ||
2283 (v->reads[0]->opcode >= INSTR_CALL0 && v->reads[0]->opcode <= INSTR_CALL8)
2288 ir_instr *call = v->reads[0];
2289 if (!vec_ir_value_find(call->params, v, ¶m)) {
2290 irerror(call->context, "internal error: unlocked parameter %s not found", v->name);
2294 ++opts_optimizationcount[OPTIM_CALL_STORES];
2295 v->callparam = true;
2297 ir_value_code_setaddr(v, OFS_PARM0 + 3*param);
2301 if (vec_size(self->owner->extparam_protos) <= param)
2302 ep = ir_gen_extparam_proto(self->owner);
2304 ep = self->owner->extparam_protos[param];
2305 ir_instr_op(v->writes[0], 0, ep, true);
2306 call->params[param+8] = ep;
2310 if (vec_size(v->writes) == 1 && v->writes[0]->opcode == INSTR_CALL0)
2312 v->store = store_return;
2313 ++opts_optimizationcount[OPTIM_CALL_STORES];
2318 if (!ir_function_allocator_assign(self, (v->locked || !opt_gt ? &lockalloc : &globalloc), v))
2322 if (!lockalloc.sizes && !globalloc.sizes) {
2325 vec_push(lockalloc.positions, 0);
2326 vec_push(globalloc.positions, 0);
2328 /* Adjust slot positions based on sizes */
2329 if (lockalloc.sizes) {
2330 pos = (vec_size(lockalloc.sizes) ? lockalloc.positions[0] : 0);
2331 for (i = 1; i < vec_size(lockalloc.sizes); ++i)
2333 pos = lockalloc.positions[i-1] + lockalloc.sizes[i-1];
2334 vec_push(lockalloc.positions, pos);
2336 self->allocated_locals = pos + vec_last(lockalloc.sizes);
2338 if (globalloc.sizes) {
2339 pos = (vec_size(globalloc.sizes) ? globalloc.positions[0] : 0);
2340 for (i = 1; i < vec_size(globalloc.sizes); ++i)
2342 pos = globalloc.positions[i-1] + globalloc.sizes[i-1];
2343 vec_push(globalloc.positions, pos);
2345 self->globaltemps = pos + vec_last(globalloc.sizes);
2348 /* Locals need to know their new position */
2349 for (i = 0; i < vec_size(self->locals); ++i) {
2350 v = self->locals[i];
2351 if (i >= vec_size(self->params) && !vec_size(v->life))
2353 if (v->locked || !opt_gt)
2354 v->code.local = lockalloc.positions[v->code.local];
2356 v->code.local = globalloc.positions[v->code.local];
2358 /* Take over the actual slot positions on values */
2359 for (i = 0; i < vec_size(self->values); ++i) {
2360 v = self->values[i];
2361 if (!vec_size(v->life))
2363 if (v->locked || !opt_gt)
2364 v->code.local = lockalloc.positions[v->code.local];
2366 v->code.local = globalloc.positions[v->code.local];
2374 for (i = 0; i < vec_size(lockalloc.locals); ++i)
2375 ir_value_delete(lockalloc.locals[i]);
2376 for (i = 0; i < vec_size(globalloc.locals); ++i)
2377 ir_value_delete(globalloc.locals[i]);
2378 vec_free(globalloc.unique);
2379 vec_free(globalloc.locals);
2380 vec_free(globalloc.sizes);
2381 vec_free(globalloc.positions);
2382 vec_free(lockalloc.unique);
2383 vec_free(lockalloc.locals);
2384 vec_free(lockalloc.sizes);
2385 vec_free(lockalloc.positions);
2389 /* Get information about which operand
2390 * is read from, or written to.
2392 static void ir_op_read_write(int op, size_t *read, size_t *write)
2412 case INSTR_STOREP_F:
2413 case INSTR_STOREP_V:
2414 case INSTR_STOREP_S:
2415 case INSTR_STOREP_ENT:
2416 case INSTR_STOREP_FLD:
2417 case INSTR_STOREP_FNC:
2428 static bool ir_block_living_add_instr(ir_block *self, size_t eid)
2431 bool changed = false;
2433 for (i = 0; i != vec_size(self->living); ++i)
2435 tempbool = ir_value_life_merge(self->living[i], eid);
2436 changed = changed || tempbool;
2441 static bool ir_block_living_lock(ir_block *self)
2444 bool changed = false;
2445 for (i = 0; i != vec_size(self->living); ++i)
2447 if (!self->living[i]->locked)
2449 self->living[i]->locked = true;
2454 static bool ir_block_life_prop_previous(ir_block* self, ir_block *prev, bool *changed)
2460 /* values which have been read in a previous iteration are now
2461 * in the "living" array even if the previous block doesn't use them.
2462 * So we have to remove whatever does not exist in the previous block.
2463 * They will be re-added on-read, but the liferange merge won't cause
2465 for (i = 0; i < vec_size(self->living); ++i)
2467 if (!vec_ir_value_find(prev->living, self->living[i], NULL)) {
2468 vec_remove(self->living, i, 1);
2474 /* Whatever the previous block still has in its living set
2475 * must now be added to ours as well.
2477 for (i = 0; i < vec_size(prev->living); ++i)
2479 if (vec_ir_value_find(self->living, prev->living[i], NULL))
2481 vec_push(self->living, prev->living[i]);
2483 irerror(self->contextt from prev: %s", self->label, prev->living[i]->_name);
2489 static bool ir_block_life_propagate(ir_block *self, ir_block *prev, bool *changed)
2494 size_t i, o, p, mem;
2495 /* bitmasks which operands are read from or written to */
2504 if (!ir_block_life_prop_previous(self, prev, changed))
2508 i = vec_size(self->instr);
2511 instr = self->instr[i];
2513 /* See which operands are read and write operands */
2514 ir_op_read_write(instr->opcode, &read, &write);
2516 if (instr->opcode == INSTR_MUL_VF)
2518 /* the float source will get an additional lifetime */
2519 tempbool = ir_value_life_merge(instr->_ops[2], instr->eid+1);
2520 *changed = *changed || tempbool;
2522 else if (instr->opcode == INSTR_MUL_FV)
2524 /* the float source will get an additional lifetime */
2525 tempbool = ir_value_life_merge(instr->_ops[1], instr->eid+1);
2526 *changed = *changed || tempbool;
2529 /* Go through the 3 main operands
2530 * writes first, then reads
2532 for (o = 0; o < 3; ++o)
2534 if (!instr->_ops[o]) /* no such operand */
2537 value = instr->_ops[o];
2539 /* We only care about locals */
2540 /* we also calculate parameter liferanges so that locals
2541 * can take up parameter slots */
2542 if (value->store != store_value &&
2543 value->store != store_local &&
2544 value->store != store_param)
2547 /* write operands */
2548 /* When we write to a local, we consider it "dead" for the
2549 * remaining upper part of the function, since in SSA a value
2550 * can only be written once (== created)
2555 bool in_living = vec_ir_value_find(self->living, value, &idx);
2558 /* If the value isn't alive it hasn't been read before... */
2559 /* TODO: See if the warning can be emitted during parsing or AST processing
2560 * otherwise have warning printed here.
2561 * IF printing a warning here: include filecontext_t,
2562 * and make sure it's only printed once
2563 * since this function is run multiple times.
2565 /* con_err( "Value only written %s\n", value->name); */
2566 tempbool = ir_value_life_merge(value, instr->eid);
2567 *changed = *changed || tempbool;
2569 /* since 'living' won't contain it
2570 * anymore, merge the value, since
2573 tempbool = ir_value_life_merge(value, instr->eid);
2574 *changed = *changed || tempbool;
2576 vec_remove(self->living, idx, 1);
2578 /* Removing a vector removes all members */
2579 for (mem = 0; mem < 3; ++mem) {
2580 if (value->members[mem] && vec_ir_value_find(self->living, value->members[mem], &idx)) {
2581 tempbool = ir_value_life_merge(value->members[mem], instr->eid);
2582 *changed = *changed || tempbool;
2583 vec_remove(self->living, idx, 1);
2586 /* Removing the last member removes the vector */
2587 if (value->memberof) {
2588 value = value->memberof;
2589 for (mem = 0; mem < 3; ++mem) {
2590 if (value->members[mem] && vec_ir_value_find(self->living, value->members[mem], NULL))
2593 if (mem == 3 && vec_ir_value_find(self->living, value, &idx)) {
2594 tempbool = ir_value_life_merge(value, instr->eid);
2595 *changed = *changed || tempbool;
2596 vec_remove(self->living, idx, 1);
2602 for (o = 0; o < 3; ++o)
2604 if (!instr->_ops[o]) /* no such operand */
2607 value = instr->_ops[o];
2609 /* We only care about locals */
2610 /* we also calculate parameter liferanges so that locals
2611 * can take up parameter slots */
2612 if (value->store != store_value &&
2613 value->store != store_local &&
2614 value->store != store_param)
2620 if (!vec_ir_value_find(self->living, value, NULL))
2621 vec_push(self->living, value);
2622 /* reading adds the full vector */
2623 if (value->memberof && !vec_ir_value_find(self->living, value->memberof, NULL))
2624 vec_push(self->living, value->memberof);
2625 for (mem = 0; mem < 3; ++mem) {
2626 if (value->members[mem] && !vec_ir_value_find(self->living, value->members[mem], NULL))
2627 vec_push(self->living, value->members[mem]);
2631 /* PHI operands are always read operands */
2632 for (p = 0; p < vec_size(instr->phi); ++p)
2634 value = instr->phi[p].value;
2635 if (!vec_ir_value_find(self->living, value, NULL))
2636 vec_push(self->living, value);
2637 /* reading adds the full vector */
2638 if (value->memberof && !vec_ir_value_find(self->living, value->memberof, NULL))
2639 vec_push(self->living, value->memberof);
2640 for (mem = 0; mem < 3; ++mem) {
2641 if (value->members[mem] && !vec_ir_value_find(self->living, value->members[mem], NULL))
2642 vec_push(self->living, value->members[mem]);
2646 /* on a call, all these values must be "locked" */
2647 if (instr->opcode >= INSTR_CALL0 && instr->opcode <= INSTR_CALL8) {
2648 if (ir_block_living_lock(self))
2651 /* call params are read operands too */
2652 for (p = 0; p < vec_size(instr->params); ++p)
2654 value = instr->params[p];
2655 if (!vec_ir_value_find(self->living, value, NULL))
2656 vec_push(self->living, value);
2657 /* reading adds the full vector */
2658 if (value->memberof && !vec_ir_value_find(self->living, value->memberof, NULL))
2659 vec_push(self->living, value->memberof);
2660 for (mem = 0; mem < 3; ++mem) {
2661 if (value->members[mem] && !vec_ir_value_find(self->living, value->members[mem], NULL))
2662 vec_push(self->living, value->members[mem]);
2667 tempbool = ir_block_living_add_instr(self, instr->eid);
2668 /*con_err( "living added values\n");*/
2669 *changed = *changed || tempbool;
2673 if (self->run_id == self->owner->run_id)
2676 self->run_id = self->owner->run_id;
2678 for (i = 0; i < vec_size(self->entries); ++i)
2680 ir_block *entry = self->entries[i];
2681 ir_block_life_propagate(entry, self, changed);
2687 /***********************************************************************
2690 * Since the IR has the convention of putting 'write' operands
2691 * at the beginning, we have to rotate the operands of instructions
2692 * properly in order to generate valid QCVM code.
2694 * Having destinations at a fixed position is more convenient. In QC
2695 * this is *mostly* OPC, but FTE adds at least 2 instructions which
2696 * read from from OPA, and store to OPB rather than OPC. Which is
2697 * partially the reason why the implementation of these instructions
2698 * in darkplaces has been delayed for so long.
2700 * Breaking conventions is annoying...
2702 static bool ir_builder_gen_global(ir_builder *self, ir_value *global, bool islocal);
2704 static bool gen_global_field(ir_value *global)
2706 if (global->hasvalue)
2708 ir_value *fld = global->constval.vpointer;
2710 irerror(global->context, "Invalid field constant with no field: %s", global->name);
2714 /* copy the field's value */
2715 ir_value_code_setaddr(global, vec_size(code_globals));
2716 vec_push(code_globals, fld->code.fieldaddr);
2717 if (global->fieldtype == TYPE_VECTOR) {
2718 vec_push(code_globals, fld->code.fieldaddr+1);
2719 vec_push(code_globals, fld->code.fieldaddr+2);
2724 ir_value_code_setaddr(global, vec_size(code_globals));
2725 vec_push(code_globals, 0);
2726 if (global->fieldtype == TYPE_VECTOR) {
2727 vec_push(code_globals, 0);
2728 vec_push(code_globals, 0);
2731 if (global->code.globaladdr < 0)
2736 static bool gen_global_pointer(ir_value *global)
2738 if (global->hasvalue)
2740 ir_value *target = global->constval.vpointer;
2742 irerror(global->context, "Invalid pointer constant: %s", global->name);
2743 /* NULL pointers are pointing to the NULL constant, which also
2744 * sits at address 0, but still has an ir_value for itself.
2749 /* Here, relocations ARE possible - in fteqcc-enhanced-qc:
2750 * void() foo; <- proto
2751 * void() *fooptr = &foo;
2752 * void() foo = { code }
2754 if (!target->code.globaladdr) {
2755 /* FIXME: Check for the constant nullptr ir_value!
2756 * because then code.globaladdr being 0 is valid.
2758 irerror(global->context, "FIXME: Relocation support");
2762 ir_value_code_setaddr(global, vec_size(code_globals));
2763 vec_push(code_globals, target->code.globaladdr);
2767 ir_value_code_setaddr(global, vec_size(code_globals));
2768 vec_push(code_globals, 0);
2770 if (global->code.globaladdr < 0)
2775 static bool gen_blocks_recursive(ir_function *func, ir_block *block)
2777 prog_section_statement stmt;
2786 block->generated = true;
2787 block->code_start = vec_size(code_statements);
2788 for (i = 0; i < vec_size(block->instr); ++i)
2790 instr = block->instr[i];
2792 if (instr->opcode == VINSTR_PHI) {
2793 irerror(block->context, "cannot generate virtual instruction (phi)");
2797 if (instr->opcode == VINSTR_JUMP) {
2798 target = instr->bops[0];
2799 /* for uncoditional jumps, if the target hasn't been generated
2800 * yet, we generate them right here.
2802 if (!target->generated) {
2807 /* otherwise we generate a jump instruction */
2808 stmt.opcode = INSTR_GOTO;
2809 stmt.o1.s1 = (target->code_start) - vec_size(code_statements);
2812 if (stmt.o1.s1 != 1)
2813 code_push_statement(&stmt, instr->context.line);
2815 /* no further instructions can be in this block */
2819 if (instr->opcode == VINSTR_COND) {
2820 ontrue = instr->bops[0];
2821 onfalse = instr->bops[1];
2822 /* TODO: have the AST signal which block should
2823 * come first: eg. optimize IFs without ELSE...
2826 stmt.o1.u1 = ir_value_code_addr(instr->_ops[0]);
2830 if (ontrue->generated) {
2831 stmt.opcode = INSTR_IF;
2832 stmt.o2.s1 = (ontrue->code_start) - vec_size(code_statements);
2833 if (stmt.o2.s1 != 1)
2834 code_push_statement(&stmt, instr->context.line);
2836 if (onfalse->generated) {
2837 stmt.opcode = INSTR_IFNOT;
2838 stmt.o2.s1 = (onfalse->code_start) - vec_size(code_statements);
2839 if (stmt.o2.s1 != 1)
2840 code_push_statement(&stmt, instr->context.line);
2842 if (!ontrue->generated) {
2843 if (onfalse->generated) {
2848 if (!onfalse->generated) {
2849 if (ontrue->generated) {
2854 /* neither ontrue nor onfalse exist */
2855 stmt.opcode = INSTR_IFNOT;
2856 if (!instr->likely) {
2857 /* Honor the likelyhood hint */
2858 ir_block *tmp = onfalse;
2859 stmt.opcode = INSTR_IF;
2863 stidx = vec_size(code_statements);
2864 code_push_statement(&stmt, instr->context.line);
2865 /* on false we jump, so add ontrue-path */
2866 if (!gen_blocks_recursive(func, ontrue))
2868 /* fixup the jump address */
2869 code_statements[stidx].o2.s1 = vec_size(code_statements) - stidx;
2870 /* generate onfalse path */
2871 if (onfalse->generated) {
2872 /* fixup the jump address */
2873 code_statements[stidx].o2.s1 = (onfalse->code_start) - (stidx);
2874 if (code_statements[stidx].o2.s1 == 1) {
2875 code_statements[stidx] = code_statements[stidx+1];
2876 if (code_statements[stidx].o1.s1 < 0)
2877 code_statements[stidx].o1.s1++;
2878 code_pop_statement();
2880 stmt.opcode = vec_last(code_statements).opcode;
2881 if (stmt.opcode == INSTR_GOTO ||
2882 stmt.opcode == INSTR_IF ||
2883 stmt.opcode == INSTR_IFNOT ||
2884 stmt.opcode == INSTR_RETURN ||
2885 stmt.opcode == INSTR_DONE)
2887 /* no use jumping from here */
2890 /* may have been generated in the previous recursive call */
2891 stmt.opcode = INSTR_GOTO;
2892 stmt.o1.s1 = (onfalse->code_start) - vec_size(code_statements);
2895 if (stmt.o1.s1 != 1)
2896 code_push_statement(&stmt, instr->context.line);
2899 else if (code_statements[stidx].o2.s1 == 1) {
2900 code_statements[stidx] = code_statements[stidx+1];
2901 if (code_statements[stidx].o1.s1 < 0)
2902 code_statements[stidx].o1.s1++;
2903 code_pop_statement();
2905 /* if not, generate now */
2910 if ( (instr->opcode >= INSTR_CALL0 && instr->opcode <= INSTR_CALL8)
2911 || instr->opcode == VINSTR_NRCALL)
2916 first = vec_size(instr->params);
2919 for (p = 0; p < first; ++p)
2921 ir_value *param = instr->params[p];
2922 if (param->callparam)
2925 stmt.opcode = INSTR_STORE_F;
2928 if (param->vtype == TYPE_FIELD)
2929 stmt.opcode = field_store_instr[param->fieldtype];
2931 stmt.opcode = type_store_instr[param->vtype];
2932 stmt.o1.u1 = ir_value_code_addr(param);
2933 stmt.o2.u1 = OFS_PARM0 + 3 * p;
2934 code_push_statement(&stmt, instr->context.line);
2936 /* Now handle extparams */
2937 first = vec_size(instr->params);
2938 for (; p < first; ++p)
2940 ir_builder *ir = func->owner;
2941 ir_value *param = instr->params[p];
2942 ir_value *targetparam;
2944 if (param->callparam)
2947 if (p-8 >= vec_size(ir->extparams))
2948 ir_gen_extparam(ir);
2950 targetparam = ir->extparams[p-8];
2952 stmt.opcode = INSTR_STORE_F;
2955 if (param->vtype == TYPE_FIELD)
2956 stmt.opcode = field_store_instr[param->fieldtype];
2958 stmt.opcode = type_store_instr[param->vtype];
2959 stmt.o1.u1 = ir_value_code_addr(param);
2960 stmt.o2.u1 = ir_value_code_addr(targetparam);
2961 code_push_statement(&stmt, instr->context.line);
2964 stmt.opcode = INSTR_CALL0 + vec_size(instr->params);
2965 if (stmt.opcode > INSTR_CALL8)
2966 stmt.opcode = INSTR_CALL8;
2967 stmt.o1.u1 = ir_value_code_addr(instr->_ops[1]);
2970 code_push_statement(&stmt, instr->context.line);
2972 retvalue = instr->_ops[0];
2973 if (retvalue && retvalue->store != store_return &&
2974 (retvalue->store == store_global || vec_size(retvalue->life)))
2976 /* not to be kept in OFS_RETURN */
2977 if (retvalue->vtype == TYPE_FIELD && OPTS_FLAG(ADJUST_VECTOR_FIELDS))
2978 stmt.opcode = field_store_instr[retvalue->fieldtype];
2980 stmt.opcode = type_store_instr[retvalue->vtype];
2981 stmt.o1.u1 = OFS_RETURN;
2982 stmt.o2.u1 = ir_value_code_addr(retvalue);
2984 code_push_statement(&stmt, instr->context.line);
2989 if (instr->opcode == INSTR_STATE) {
2990 irerror(block->context, "TODO: state instruction");
2994 stmt.opcode = instr->opcode;
2999 /* This is the general order of operands */
3001 stmt.o3.u1 = ir_value_code_addr(instr->_ops[0]);
3004 stmt.o1.u1 = ir_value_code_addr(instr->_ops[1]);
3007 stmt.o2.u1 = ir_value_code_addr(instr->_ops[2]);
3009 if (stmt.opcode == INSTR_RETURN || stmt.opcode == INSTR_DONE)
3011 stmt.o1.u1 = stmt.o3.u1;
3014 else if ((stmt.opcode >= INSTR_STORE_F &&
3015 stmt.opcode <= INSTR_STORE_FNC) ||
3016 (stmt.opcode >= INSTR_STOREP_F &&
3017 stmt.opcode <= INSTR_STOREP_FNC))
3019 /* 2-operand instructions with A -> B */
3020 stmt.o2.u1 = stmt.o3.u1;
3023 /* tiny optimization, don't output
3026 if (stmt.o2.u1 == stmt.o1.u1 &&
3027 OPTS_OPTIMIZATION(OPTIM_PEEPHOLE))
3029 ++opts_optimizationcount[OPTIM_PEEPHOLE];
3034 code_push_statement(&stmt, instr->context.line);
3039 static bool gen_function_code(ir_function *self)
3042 prog_section_statement stmt, *retst;
3044 /* Starting from entry point, we generate blocks "as they come"
3045 * for now. Dead blocks will not be translated obviously.
3047 if (!vec_size(self->blocks)) {
3048 irerror(self->context, "Function '%s' declared without body.", self->name);
3052 block = self->blocks[0];
3053 if (block->generated)
3056 if (!gen_blocks_recursive(self, block)) {
3057 irerror(self->context, "failed to generate blocks for '%s'", self->name);
3061 /* code_write and qcvm -disasm need to know that the function ends here */
3062 retst = &vec_last(code_statements);
3063 if (OPTS_OPTIMIZATION(OPTIM_VOID_RETURN) &&
3064 self->outtype == TYPE_VOID &&
3065 retst->opcode == INSTR_RETURN &&
3066 !retst->o1.u1 && !retst->o2.u1 && !retst->o3.u1)
3068 retst->opcode = INSTR_DONE;
3069 ++opts_optimizationcount[OPTIM_VOID_RETURN];
3071 stmt.opcode = INSTR_DONE;
3075 code_push_statement(&stmt, vec_last(code_linenums));
3080 static qcint ir_builder_filestring(ir_builder *ir, const char *filename)
3082 /* NOTE: filename pointers are copied, we never strdup them,
3083 * thus we can use pointer-comparison to find the string.
3088 for (i = 0; i < vec_size(ir->filenames); ++i) {
3089 if (ir->filenames[i] == filename)
3090 return ir->filestrings[i];
3093 str = code_genstring(filename);
3094 vec_push(ir->filenames, filename);
3095 vec_push(ir->filestrings, str);
3099 static bool gen_global_function(ir_builder *ir, ir_value *global)
3101 prog_section_function fun;
3106 if (!global->hasvalue || (!global->constval.vfunc))
3108 irerror(global->context, "Invalid state of function-global: not constant: %s", global->name);
3112 irfun = global->constval.vfunc;
3114 fun.name = global->code.name;
3115 fun.file = ir_builder_filestring(ir, global->context.file);
3116 fun.profile = 0; /* always 0 */
3117 fun.nargs = vec_size(irfun->params);
3121 for (i = 0;i < 8; ++i) {
3122 if ((int32_t)i >= fun.nargs)
3125 fun.argsize[i] = type_sizeof_[irfun->params[i]];
3129 fun.locals = irfun->allocated_locals;
3132 fun.entry = irfun->builtin+1;
3134 irfun->code_function_def = vec_size(code_functions);
3135 fun.entry = vec_size(code_statements);
3138 vec_push(code_functions, fun);
3142 static ir_value* ir_gen_extparam_proto(ir_builder *ir)
3147 snprintf(name, sizeof(name), "EXTPARM#%i", (int)(vec_size(ir->extparam_protos)+8));
3148 global = ir_value_var(name, store_global, TYPE_VECTOR);
3150 vec_push(ir->extparam_protos, global);
3154 static void ir_gen_extparam(ir_builder *ir)
3156 prog_section_def def;
3159 if (vec_size(ir->extparam_protos) < vec_size(ir->extparams)+1)
3160 global = ir_gen_extparam_proto(ir);
3162 global = ir->extparam_protos[vec_size(ir->extparams)];
3164 def.name = code_genstring(global->name);
3165 def.type = TYPE_VECTOR;
3166 def.offset = vec_size(code_globals);
3168 vec_push(code_defs, def);
3169 ir_value_code_setaddr(global, def.offset);
3170 vec_push(code_globals, 0);
3171 vec_push(code_globals, 0);
3172 vec_push(code_globals, 0);
3174 vec_push(ir->extparams, global);
3177 static bool gen_function_extparam_copy(ir_function *self)
3179 size_t i, ext, numparams;
3181 ir_builder *ir = self->owner;
3183 prog_section_statement stmt;
3185 numparams = vec_size(self->params);
3189 stmt.opcode = INSTR_STORE_F;
3191 for (i = 8; i < numparams; ++i) {
3193 if (ext >= vec_size(ir->extparams))
3194 ir_gen_extparam(ir);
3196 ep = ir->extparams[ext];
3198 stmt.opcode = type_store_instr[self->locals[i]->vtype];
3199 if (self->locals[i]->vtype == TYPE_FIELD &&
3200 self->locals[i]->fieldtype == TYPE_VECTOR)
3202 stmt.opcode = INSTR_STORE_V;
3204 stmt.o1.u1 = ir_value_code_addr(ep);
3205 stmt.o2.u1 = ir_value_code_addr(self->locals[i]);
3206 code_push_statement(&stmt, self->context.line);
3212 static bool gen_function_locals(ir_builder *ir, ir_value *global)
3214 prog_section_function *def;
3217 uint32_t firstlocal, firstglobal;
3219 irfun = global->constval.vfunc;
3220 def = code_functions + irfun->code_function_def;
3222 if (opts.g || !OPTS_OPTIMIZATION(OPTIM_OVERLAP_LOCALS) || (irfun->flags & IR_FLAG_MASK_NO_OVERLAP))
3223 firstlocal = def->firstlocal = vec_size(code_globals);
3225 firstlocal = def->firstlocal = ir->first_common_local;
3226 ++opts_optimizationcount[OPTIM_OVERLAP_LOCALS];
3229 firstglobal = (OPTS_OPTIMIZATION(OPTIM_GLOBAL_TEMPS) ? ir->first_common_globaltemp : firstlocal);
3231 for (i = vec_size(code_globals); i < firstlocal + irfun->allocated_locals; ++i)
3232 vec_push(code_globals, 0);
3233 for (i = 0; i < vec_size(irfun->locals); ++i) {
3234 ir_value *v = irfun->locals[i];
3235 if (v->locked || !OPTS_OPTIMIZATION(OPTIM_GLOBAL_TEMPS)) {
3236 ir_value_code_setaddr(v, firstlocal + v->code.local);
3237 if (!ir_builder_gen_global(ir, irfun->locals[i], true)) {
3238 irerror(irfun->locals[i]->context, "failed to generate local %s", irfun->locals[i]->name);
3243 ir_value_code_setaddr(v, firstglobal + v->code.local);
3245 for (i = 0; i < vec_size(irfun->values); ++i)
3247 ir_value *v = irfun->values[i];
3251 ir_value_code_setaddr(v, firstlocal + v->code.local);
3253 ir_value_code_setaddr(v, firstglobal + v->code.local);
3258 static bool gen_global_function_code(ir_builder *ir, ir_value *global)
3260 prog_section_function *fundef;
3265 irfun = global->constval.vfunc;
3267 if (global->cvq == CV_NONE) {
3268 irwarning(global->context, WARN_IMPLICIT_FUNCTION_POINTER,
3269 "function `%s` has no body and in QC implicitly becomes a function-pointer", global->name);
3271 /* this was a function pointer, don't generate code for those */
3278 if (irfun->code_function_def < 0) {
3279 irerror(irfun->context, "`%s`: IR global wasn't generated, failed to access function-def", irfun->name);
3282 fundef = &code_functions[irfun->code_function_def];
3284 fundef->entry = vec_size(code_statements);
3285 if (!gen_function_locals(ir, global)) {
3286 irerror(irfun->context, "Failed to generate locals for function %s", irfun->name);
3289 if (!gen_function_extparam_copy(irfun)) {
3290 irerror(irfun->context, "Failed to generate extparam-copy code for function %s", irfun->name);
3293 if (!gen_function_code(irfun)) {
3294 irerror(irfun->context, "Failed to generate code for function %s", irfun->name);
3300 static void gen_vector_defs(prog_section_def def, const char *name)
3305 if (!name || name[0] == '#' || OPTS_FLAG(SINGLE_VECTOR_DEFS))
3308 def.type = TYPE_FLOAT;
3312 component = (char*)mem_a(len+3);
3313 memcpy(component, name, len);
3315 component[len-0] = 0;
3316 component[len-2] = '_';
3318 component[len-1] = 'x';
3320 for (i = 0; i < 3; ++i) {
3321 def.name = code_genstring(component);
3322 vec_push(code_defs, def);
3328 static void gen_vector_fields(prog_section_field fld, const char *name)
3333 if (!name || OPTS_FLAG(SINGLE_VECTOR_DEFS))
3336 fld.type = TYPE_FLOAT;
3340 component = (char*)mem_a(len+3);
3341 memcpy(component, name, len);
3343 component[len-0] = 0;
3344 component[len-2] = '_';
3346 component[len-1] = 'x';
3348 for (i = 0; i < 3; ++i) {
3349 fld.name = code_genstring(component);
3350 vec_push(code_fields, fld);
3356 static bool ir_builder_gen_global(ir_builder *self, ir_value *global, bool islocal)
3360 prog_section_def def;
3361 bool pushdef = false;
3363 def.type = global->vtype;
3364 def.offset = vec_size(code_globals);
3366 if (opts.g || !islocal)
3370 if (OPTS_OPTIMIZATION(OPTIM_STRIP_CONSTANT_NAMES) &&
3371 (global->name[0] == '#' || global->cvq == CV_CONST))
3376 if (pushdef && global->name) {
3377 if (global->name[0] == '#') {
3378 if (!self->str_immediate)
3379 self->str_immediate = code_genstring("IMMEDIATE");
3380 def.name = global->code.name = self->str_immediate;
3383 def.name = global->code.name = code_genstring(global->name);
3388 def.offset = ir_value_code_addr(global);
3389 vec_push(code_defs, def);
3390 if (global->vtype == TYPE_VECTOR)
3391 gen_vector_defs(def, global->name);
3392 else if (global->vtype == TYPE_FIELD && global->fieldtype == TYPE_VECTOR)
3393 gen_vector_defs(def, global->name);
3400 switch (global->vtype)
3403 if (!strcmp(global->name, "end_sys_globals")) {
3404 /* TODO: remember this point... all the defs before this one
3405 * should be checksummed and added to progdefs.h when we generate it.
3408 else if (!strcmp(global->name, "end_sys_fields")) {
3409 /* TODO: same as above but for entity-fields rather than globsl
3413 irwarning(global->context, WARN_VOID_VARIABLES, "unrecognized variable of type void `%s`",
3415 /* I'd argue setting it to 0 is sufficient, but maybe some depend on knowing how far
3416 * the system fields actually go? Though the engine knows this anyway...
3417 * Maybe this could be an -foption
3418 * fteqcc creates data for end_sys_* - of size 1, so let's do the same
3420 ir_value_code_setaddr(global, vec_size(code_globals));
3421 vec_push(code_globals, 0);
3423 if (pushdef) vec_push(code_defs, def);
3426 if (pushdef) vec_push(code_defs, def);
3427 return gen_global_pointer(global);
3430 vec_push(code_defs, def);
3431 if (global->fieldtype == TYPE_VECTOR)
3432 gen_vector_defs(def, global->name);
3434 return gen_global_field(global);
3439 ir_value_code_setaddr(global, vec_size(code_globals));
3440 if (global->hasvalue) {
3441 iptr = (int32_t*)&global->constval.ivec[0];
3442 vec_push(code_globals, *iptr);
3444 vec_push(code_globals, 0);
3446 if (!islocal && global->cvq != CV_CONST)
3447 def.type |= DEF_SAVEGLOBAL;
3448 if (pushdef) vec_push(code_defs, def);
3450 return global->code.globaladdr >= 0;
3454 ir_value_code_setaddr(global, vec_size(code_globals));
3455 if (global->hasvalue) {
3456 vec_push(code_globals, code_genstring(global->constval.vstring));
3458 vec_push(code_globals, 0);
3460 if (!islocal && global->cvq != CV_CONST)
3461 def.type |= DEF_SAVEGLOBAL;
3462 if (pushdef) vec_push(code_defs, def);
3463 return global->code.globaladdr >= 0;
3468 ir_value_code_setaddr(global, vec_size(code_globals));
3469 if (global->hasvalue) {
3470 iptr = (int32_t*)&global->constval.ivec[0];
3471 vec_push(code_globals, iptr[0]);
3472 if (global->code.globaladdr < 0)
3474 for (d = 1; d < type_sizeof_[global->vtype]; ++d) {
3475 vec_push(code_globals, iptr[d]);
3478 vec_push(code_globals, 0);
3479 if (global->code.globaladdr < 0)
3481 for (d = 1; d < type_sizeof_[global->vtype]; ++d) {
3482 vec_push(code_globals, 0);
3485 if (!islocal && global->cvq != CV_CONST)
3486 def.type |= DEF_SAVEGLOBAL;
3489 vec_push(code_defs, def);
3490 def.type &= ~DEF_SAVEGLOBAL;
3491 gen_vector_defs(def, global->name);
3493 return global->code.globaladdr >= 0;
3496 ir_value_code_setaddr(global, vec_size(code_globals));
3497 if (!global->hasvalue) {
3498 vec_push(code_globals, 0);
3499 if (global->code.globaladdr < 0)
3502 vec_push(code_globals, vec_size(code_functions));
3503 if (!gen_global_function(self, global))
3506 if (!islocal && global->cvq != CV_CONST)
3507 def.type |= DEF_SAVEGLOBAL;
3508 if (pushdef) vec_push(code_defs, def);
3511 /* assume biggest type */
3512 ir_value_code_setaddr(global, vec_size(code_globals));
3513 vec_push(code_globals, 0);
3514 for (i = 1; i < type_sizeof_[TYPE_VARIANT]; ++i)
3515 vec_push(code_globals, 0);
3518 /* refuse to create 'void' type or any other fancy business. */
3519 irerror(global->context, "Invalid type for global variable `%s`: %s",
3520 global->name, type_name[global->vtype]);
3525 static void ir_builder_prepare_field(ir_value *field)
3527 field->code.fieldaddr = code_alloc_field(type_sizeof_[field->fieldtype]);
3530 static bool ir_builder_gen_field(ir_builder *self, ir_value *field)
3532 prog_section_def def;
3533 prog_section_field fld;
3537 def.type = (uint16_t)field->vtype;
3538 def.offset = (uint16_t)vec_size(code_globals);
3540 /* create a global named the same as the field */
3541 if (opts.standard == COMPILER_GMQCC) {
3542 /* in our standard, the global gets a dot prefix */
3543 size_t len = strlen(field->name);
3546 /* we really don't want to have to allocate this, and 1024
3547 * bytes is more than enough for a variable/field name
3549 if (len+2 >= sizeof(name)) {
3550 irerror(field->context, "invalid field name size: %u", (unsigned int)len);
3555 memcpy(name+1, field->name, len); /* no strncpy - we used strlen above */
3558 def.name = code_genstring(name);
3559 fld.name = def.name + 1; /* we reuse that string table entry */
3561 /* in plain QC, there cannot be a global with the same name,
3562 * and so we also name the global the same.
3563 * FIXME: fteqcc should create a global as well
3564 * check if it actually uses the same name. Probably does
3566 def.name = code_genstring(field->name);
3567 fld.name = def.name;
3570 field->code.name = def.name;
3572 vec_push(code_defs, def);
3574 fld.type = field->fieldtype;
3576 if (fld.type == TYPE_VOID) {
3577 irerror(field->context, "field is missing a type: %s - don't know its size", field->name);
3581 fld.offset = field->code.fieldaddr;
3583 vec_push(code_fields, fld);
3585 ir_value_code_setaddr(field, vec_size(code_globals));
3586 vec_push(code_globals, fld.offset);
3587 if (fld.type == TYPE_VECTOR) {
3588 vec_push(code_globals, fld.offset+1);
3589 vec_push(code_globals, fld.offset+2);
3592 if (field->fieldtype == TYPE_VECTOR) {
3593 gen_vector_defs(def, field->name);
3594 gen_vector_fields(fld, field->name);
3597 return field->code.globaladdr >= 0;
3600 bool ir_builder_generate(ir_builder *self, const char *filename)
3602 prog_section_statement stmt;
3604 char *lnofile = NULL;
3608 for (i = 0; i < vec_size(self->fields); ++i)
3610 ir_builder_prepare_field(self->fields[i]);
3613 for (i = 0; i < vec_size(self->globals); ++i)
3615 if (!ir_builder_gen_global(self, self->globals[i], false)) {
3618 if (self->globals[i]->vtype == TYPE_FUNCTION) {
3619 ir_function *func = self->globals[i]->constval.vfunc;
3620 if (func && self->max_locals < func->allocated_locals &&
3621 !(func->flags & IR_FLAG_MASK_NO_OVERLAP))
3623 self->max_locals = func->allocated_locals;
3625 if (func && self->max_globaltemps < func->globaltemps)
3626 self->max_globaltemps = func->globaltemps;
3630 for (i = 0; i < vec_size(self->fields); ++i)
3632 if (!ir_builder_gen_field(self, self->fields[i])) {
3637 /* generate global temps */
3638 self->first_common_globaltemp = vec_size(code_globals);
3639 for (i = 0; i < self->max_globaltemps; ++i) {
3640 vec_push(code_globals, 0);
3642 /* generate common locals */
3643 self->first_common_local = vec_size(code_globals);
3644 for (i = 0; i < self->max_locals; ++i) {
3645 vec_push(code_globals, 0);
3648 /* generate function code */
3649 for (i = 0; i < vec_size(self->globals); ++i)
3651 if (self->globals[i]->vtype == TYPE_FUNCTION) {
3652 if (!gen_global_function_code(self, self->globals[i])) {
3658 if (vec_size(code_globals) >= 65536) {
3659 irerror(vec_last(self->globals)->context, "This progs file would require more globals than the metadata can handle. Bailing out.");
3663 /* DP errors if the last instruction is not an INSTR_DONE. */
3664 if (vec_last(code_statements).opcode != INSTR_DONE)
3666 stmt.opcode = INSTR_DONE;
3670 code_push_statement(&stmt, vec_last(code_linenums));
3676 if (vec_size(code_statements) != vec_size(code_linenums)) {
3677 con_err("Linecounter wrong: %lu != %lu\n",
3678 (unsigned long)vec_size(code_statements),
3679 (unsigned long)vec_size(code_linenums));
3680 } else if (OPTS_FLAG(LNO)) {
3682 size_t filelen = strlen(filename);
3684 memcpy(vec_add(lnofile, filelen+1), filename, filelen+1);
3685 dot = strrchr(lnofile, '.');
3689 vec_shrinkto(lnofile, dot - lnofile);
3691 memcpy(vec_add(lnofile, 5), ".lno", 5);
3696 con_out("writing '%s' and '%s'...\n", filename, lnofile);
3698 con_out("writing '%s'\n", filename);
3700 if (!code_write(filename, lnofile)) {
3708 /***********************************************************************
3709 *IR DEBUG Dump functions...
3712 #define IND_BUFSZ 1024
3715 # define strncat(dst, src, sz) strncat_s(dst, sz, src, _TRUNCATE)
3718 const char *qc_opname(int op)
3720 if (op < 0) return "<INVALID>";
3721 if (op < (int)( sizeof(asm_instr) / sizeof(asm_instr[0]) ))
3722 return asm_instr[op].m;
3724 case VINSTR_PHI: return "PHI";
3725 case VINSTR_JUMP: return "JUMP";
3726 case VINSTR_COND: return "COND";
3727 default: return "<UNK>";
3731 void ir_builder_dump(ir_builder *b, int (*oprintf)(const char*, ...))
3734 char indent[IND_BUFSZ];
3738 oprintf("module %s\n", b->name);
3739 for (i = 0; i < vec_size(b->globals); ++i)
3742 if (b->globals[i]->hasvalue)
3743 oprintf("%s = ", b->globals[i]->name);
3744 ir_value_dump(b->globals[i], oprintf);
3747 for (i = 0; i < vec_size(b->functions); ++i)
3748 ir_function_dump(b->functions[i], indent, oprintf);
3749 oprintf("endmodule %s\n", b->name);
3752 void ir_function_dump(ir_function *f, char *ind,
3753 int (*oprintf)(const char*, ...))
3756 if (f->builtin != 0) {
3757 oprintf("%sfunction %s = builtin %i\n", ind, f->name, -f->builtin);
3760 oprintf("%sfunction %s\n", ind, f->name);
3761 strncat(ind, "\t", IND_BUFSZ);
3762 if (vec_size(f->locals))
3764 oprintf("%s%i locals:\n", ind, (int)vec_size(f->locals));
3765 for (i = 0; i < vec_size(f->locals); ++i) {
3766 oprintf("%s\t", ind);
3767 ir_value_dump(f->locals[i], oprintf);
3771 oprintf("%sliferanges:\n", ind);
3772 for (i = 0; i < vec_size(f->locals); ++i) {
3773 const char *attr = "";
3775 ir_value *v = f->locals[i];
3776 if (v->unique_life && v->locked)
3777 attr = "unique,locked ";
3778 else if (v->unique_life)
3782 oprintf("%s\t%s: %s@%i ", ind, v->name, attr, (int)v->code.local);
3783 for (l = 0; l < vec_size(v->life); ++l) {
3784 oprintf("[%i,%i] ", v->life[l].start, v->life[l].end);
3787 for (m = 0; m < 3; ++m) {
3788 ir_value *vm = v->members[m];
3791 if (vm->unique_life && vm->locked)
3792 attr = "unique,locked ";
3793 else if (vm->unique_life)
3795 else if (vm->locked)
3797 oprintf("%s\t%s: %s@%i ", ind, vm->name, attr, (int)vm->code.local);
3798 for (l = 0; l < vec_size(vm->life); ++l) {
3799 oprintf("[%i,%i] ", vm->life[l].start, vm->life[l].end);
3804 for (i = 0; i < vec_size(f->values); ++i) {
3806 ir_value *v = f->values[i];
3807 oprintf("%s\t%s: @%i ", ind, v->name, (int)v->code.local);
3808 for (l = 0; l < vec_size(v->life); ++l) {
3809 oprintf("[%i,%i] ", v->life[l].start, v->life[l].end);
3813 if (vec_size(f->blocks))
3815 oprintf("%slife passes (check): %i\n", ind, (int)f->run_id);
3816 for (i = 0; i < vec_size(f->blocks); ++i) {
3817 if (f->blocks[i]->run_id != f->run_id) {
3818 oprintf("%slife pass check fail! %i != %i\n", ind, (int)f->blocks[i]->run_id, (int)f->run_id);
3820 ir_block_dump(f->blocks[i], ind, oprintf);
3824 ind[strlen(ind)-1] = 0;
3825 oprintf("%sendfunction %s\n", ind, f->name);
3828 void ir_block_dump(ir_block* b, char *ind,
3829 int (*oprintf)(const char*, ...))
3832 oprintf("%s:%s\n", ind, b->label);
3833 strncat(ind, "\t", IND_BUFSZ);
3835 for (i = 0; i < vec_size(b->instr); ++i)
3836 ir_instr_dump(b->instr[i], ind, oprintf);
3837 ind[strlen(ind)-1] = 0;
3840 void dump_phi(ir_instr *in, int (*oprintf)(const char*, ...))
3843 oprintf("%s <- phi ", in->_ops[0]->name);
3844 for (i = 0; i < vec_size(in->phi); ++i)
3846 oprintf("([%s] : %s) ", in->phi[i].from->label,
3847 in->phi[i].value->name);
3852 void ir_instr_dump(ir_instr *in, char *ind,
3853 int (*oprintf)(const char*, ...))
3856 const char *comma = NULL;
3858 oprintf("%s (%i) ", ind, (int)in->eid);
3860 if (in->opcode == VINSTR_PHI) {
3861 dump_phi(in, oprintf);
3865 strncat(ind, "\t", IND_BUFSZ);
3867 if (in->_ops[0] && (in->_ops[1] || in->_ops[2])) {
3868 ir_value_dump(in->_ops[0], oprintf);
3869 if (in->_ops[1] || in->_ops[2])
3872 if (in->opcode == INSTR_CALL0 || in->opcode == VINSTR_NRCALL) {
3873 oprintf("CALL%i\t", vec_size(in->params));
3875 oprintf("%s\t", qc_opname(in->opcode));
3877 if (in->_ops[0] && !(in->_ops[1] || in->_ops[2])) {
3878 ir_value_dump(in->_ops[0], oprintf);
3883 for (i = 1; i != 3; ++i) {
3887 ir_value_dump(in->_ops[i], oprintf);
3895 oprintf("[%s]", in->bops[0]->label);
3899 oprintf("%s[%s]", comma, in->bops[1]->label);
3900 if (vec_size(in->params)) {
3901 oprintf("\tparams: ");
3902 for (i = 0; i != vec_size(in->params); ++i) {
3903 oprintf("%s, ", in->params[i]->name);
3907 ind[strlen(ind)-1] = 0;
3910 void ir_value_dump_string(const char *str, int (*oprintf)(const char*, ...))
3913 for (; *str; ++str) {
3915 case '\n': oprintf("\\n"); break;
3916 case '\r': oprintf("\\r"); break;
3917 case '\t': oprintf("\\t"); break;
3918 case '\v': oprintf("\\v"); break;
3919 case '\f': oprintf("\\f"); break;
3920 case '\b': oprintf("\\b"); break;
3921 case '\a': oprintf("\\a"); break;
3922 case '\\': oprintf("\\\\"); break;
3923 case '"': oprintf("\\\""); break;
3924 default: oprintf("%c", *str); break;
3930 void ir_value_dump(ir_value* v, int (*oprintf)(const char*, ...))
3939 oprintf("fn:%s", v->name);
3942 oprintf("%g", v->constval.vfloat);
3945 oprintf("'%g %g %g'",
3948 v->constval.vvec.z);
3951 oprintf("(entity)");
3954 ir_value_dump_string(v->constval.vstring, oprintf);
3958 oprintf("%i", v->constval.vint);
3963 v->constval.vpointer->name);
3967 oprintf("%s", v->name);
3971 void ir_value_dump_life(const ir_value *self, int (*oprintf)(const char*,...))
3974 oprintf("Life of %12s:", self->name);
3975 for (i = 0; i < vec_size(self->life); ++i)
3977 oprintf(" + [%i, %i]\n", self->life[i].start, self->life[i].end);