2 * emit-x86.c: Support functions for emitting x86 code
5 * Dietmar Maurer (dietmar@ximian.com)
6 * Miguel de Icaza (miguel@ximian.com)
8 * (C) 2001 Ximian, Inc.
14 #include <mono/metadata/assembly.h>
15 #include <mono/metadata/loader.h>
16 #include <mono/metadata/cil-coff.h>
17 #include <mono/metadata/tabledefs.h>
18 #include <mono/metadata/class.h>
19 #include <mono/metadata/debug-helpers.h>
20 #include <mono/metadata/mono-endian.h>
21 #include <mono/arch/x86/x86-codegen.h>
22 #include <mono/metadata/profiler-private.h>
30 //#define DEBUG_REGALLOC
31 //#define DEBUG_SPILLS
/* Presumably returns a printable name for the x86 register `regnum`
 * (inferred from the function name; the body is not visible in this excerpt). */
34 arch_get_reg_name (int regnum)
/* Aborts if control ever reaches this statement. */
55 g_assert_not_reached ();
61 * we may want an x86-specific header or we
62 * can just declare it extern in x86.brg.
/* Starts at 0; mono_cpu_detect () sets it to 1 when CPUID function 1
 * reports bit 15 of EDX. */
64 int mono_x86_have_cmov = 0;
/* Runs the CPUID instruction and stores the resulting EAX/EBX/ECX/EDX values
 * through the four out-pointers.  mono_cpu_detect () treats the return value
 * as a success flag. */
67 cpuid (int id, int* p_eax, int* p_ebx, int* p_ecx, int* p_edx)
/* First asm block: toggles and then tests mask 0x200000 in EAX.
 * NOTE(review): presumably this is the EFLAGS ID-bit probe for CPUID
 * support; the surrounding instructions are elided here - confirm. */
73 __asm__ __volatile__ (
77 "xorl $0x200000, %%eax\n"
83 "andl $0x200000, %%eax\n"
/* Second asm block: the actual CPUID; the "=a"/"=b"/"=c"/"=d" constraints
 * bind the four result registers to the caller-supplied locations. */
91 __asm__ __volatile__ ("cpuid"
92 : "=a" (*p_eax), "=b" (*p_ebx), "=c" (*p_ecx), "=d" (*p_edx)
/* Queries CPUID function 1 and records in mono_x86_have_cmov whether bit 15
 * of the returned EDX feature flags is set. */
101 mono_cpu_detect (void) {
102 int eax, ebx, ecx, edx;
104 /* Feature Flags function, flags returned in EDX. */
105 if (cpuid(1, &eax, &ebx, &ecx, &edx)) {
/* Bit 15 of EDX is tested; the flag name suggests this is the CMOV bit. */
106 if (edx & (1U << 15)) {
107 mono_x86_have_cmov = 1;
113 * arch_get_argument_info:
114 * @csig: a method signature
115 * @param_count: the number of parameters to consider
116 * @arg_info: an array to store the result infos
118 * Gathers information on parameters such as size, alignment and
119 * padding. arg_info should be large enough to hold param_count + 1 entries.
121 * Returns the size of the activation frame.
/* Fills arg_info [0 .. param_count] with offset/size/pad data while
 * accumulating the running frame size in frame_size.  Several lines
 * (including the conditions selecting some branches) are elided in this
 * excerpt. */
124 arch_get_argument_info (MonoMethodSignature *csig, int param_count, MonoJitArgumentInfo *arg_info)
126 int k, frame_size = 0;
127 int size, align, pad;
/* A struct return value costs one pointer-sized slot in the frame. */
130 if (MONO_TYPE_ISSTRUCT (csig->ret)) {
131 frame_size += sizeof (gpointer);
135 arg_info [0].offset = offset;
/* Another pointer-sized slot; the guarding condition is not visible here. */
138 frame_size += sizeof (gpointer);
/* Entry 0 records the frame size accumulated before any parameter. */
142 arg_info [0].size = frame_size;
144 for (k = 0; k < param_count; k++) {
/* Two alternative size queries (native vs. managed stack size); the
 * condition choosing between them is elided. */
147 size = mono_type_native_stack_size (csig->params [k], &align);
149 size = mono_type_stack_size (csig->params [k], &align);
/* pad = bytes needed to round frame_size up to a multiple of align; the
 * mask arithmetic only works when align is a power of two. */
151 frame_size += pad = (align - (frame_size & (align - 1))) & (align - 1);
/* The padding is stored on the preceding entry (index k), the parameter's
 * own data on entry k + 1. */
152 arg_info [k].pad = pad;
154 arg_info [k + 1].pad = 0;
155 arg_info [k + 1].size = size;
157 arg_info [k + 1].offset = offset;
/* Final round-up of the frame to MONO_FRAME_ALIGNMENT; presumably this runs
 * after the loop, so k == param_count and the pad lands on the last entry. */
161 align = MONO_FRAME_ALIGNMENT;
162 frame_size += pad = (align - (frame_size & (align - 1))) & (align - 1);
163 arg_info [k].pad = pad;
/* Trace helper: prints "ENTER: <method>" followed by a dump of the arguments
 * read from the frame at `ebp`.  arch_emit_prologue () emits a call to this
 * function when mono_jit_trace_calls is set. */
169 enter_method (MonoMethod *method, char *ebp)
174 MonoJitArgumentInfo *arg_info;
175 MonoMethodSignature *sig;
178 fname = mono_method_full_name (method, TRUE);
179 printf ("ENTER: %s\n(", fname);
/* Abort on a misaligned frame pointer.  The (int) cast of a pointer assumes
 * pointers fit in an int. */
182 if (((int)ebp & (MONO_FRAME_ALIGNMENT - 1)) != 0) {
183 g_error ("unaligned stack detected (%p)", ebp);
186 sig = method->signature;
/* param_count + 1 entries: entry 0 plus one per parameter, matching what
 * arch_get_argument_info () writes. */
188 arg_info = alloca (sizeof (MonoJitArgumentInfo) * (sig->param_count + 1));
190 arch_get_argument_info (sig, sig->param_count, arg_info);
/* Struct returns: print the pointer stored at ebp + 8. */
192 if (MONO_TYPE_ISSTRUCT (method->signature->ret)) {
193 g_assert (!method->signature->ret->byref);
195 printf ("VALUERET:%p, ", *((gpointer *)(ebp + 8)));
/* The `this` argument lives at the offset recorded in arg_info [0]. */
198 if (method->signature->hasthis) {
199 gpointer *this = (gpointer *)(ebp + arg_info [0].offset);
200 if (method->klass->valuetype) {
201 printf ("value:%p, ", *this);
203 o = *((MonoObject **)this);
206 class = o->vtable->klass;
/* NOTE(review): the mono_string_to_utf8 () result is handed straight to
 * printf; if it is a fresh allocation it is never freed - confirm. */
208 if (class == mono_defaults.string_class) {
209 printf ("this:[STRING:%p:%s], ", o, mono_string_to_utf8 ((MonoString *)o));
211 printf ("this:%p[%s.%s], ", o, class->name_space, class->name);
214 printf ("this:NULL, ");
/* Parameter i is described by arg_info [i + 1]. */
218 for (i = 0; i < method->signature->param_count; ++i) {
219 gpointer *cpos = (gpointer *)(ebp + arg_info [i + 1].offset);
220 int size = arg_info [i + 1].size;
222 MonoType *type = method->signature->params [i];
225 printf ("[BYREF:%p], ", *cpos);
226 } else switch (type->type) {
228 case MONO_TYPE_BOOLEAN:
238 printf ("%d, ", *((int *)(cpos)));
240 case MONO_TYPE_STRING: {
241 MonoString *s = *((MonoString **)cpos);
243 g_assert (((MonoObject *)s)->vtable->klass == mono_defaults.string_class);
244 printf ("[STRING:%p:%s], ", s, mono_string_to_utf8 (s));
246 printf ("[STRING:null], ");
249 case MONO_TYPE_CLASS:
250 case MONO_TYPE_OBJECT: {
251 o = *((MonoObject **)cpos);
253 class = o->vtable->klass;
255 if (class == mono_defaults.string_class) {
256 printf ("[STRING:%p:%s], ", o, mono_string_to_utf8 ((MonoString *)o));
257 } else if (class == mono_defaults.int32_class) {
/* Boxed Int32: the payload is read right after the MonoObject header. */
258 printf ("[INT32:%p:%d], ", o, *(gint32 *)((char *)o + sizeof (MonoObject)));
260 printf ("[%s.%s:%p], ", class->name_space, class->name, o);
262 printf ("%p, ", *((gpointer *)(cpos)));
267 case MONO_TYPE_FNPTR:
268 case MONO_TYPE_ARRAY:
269 case MONO_TYPE_SZARRAY:
270 printf ("%p, ", *((gpointer *)(cpos)));
273 printf ("%lld, ", *((gint64 *)(cpos)));
276 printf ("%f, ", *((float *)(cpos)));
279 printf ("%f, ", *((double *)(cpos)));
/* Value types are dumped byte by byte in hex, `size` bytes in total. */
281 case MONO_TYPE_VALUETYPE:
283 for (j = 0; j < size; j++)
284 printf ("%02x,", *((guint8*)cpos +j));
/* Trace helper: prints "LEAVE: <method>" followed by the return value,
 * decoded according to the method's return type.  `eax`/`edx` carry the
 * integer return registers and `test` the floating-point value;
 * arch_emit_epilogue () pushes the arguments in the matching order. */
296 leave_method (MonoMethod *method, int edx, int eax, double test)
301 fname = mono_method_full_name (method, TRUE);
302 printf ("LEAVE: %s", fname);
305 switch (method->signature->ret->type) {
308 case MONO_TYPE_BOOLEAN:
310 printf ("TRUE:%d", eax);
324 printf ("EAX=%d", eax);
326 case MONO_TYPE_STRING: {
/* int -> pointer cast: assumes pointers fit in an int. */
327 MonoString *s = (MonoString *)eax;
330 g_assert (((MonoObject *)s)->vtable->klass == mono_defaults.string_class);
331 printf ("[STRING:%p:%s]", s, mono_string_to_utf8 (s));
/* NOTE(review): this is the only return-value format here that ends in
 * ", ". */
333 printf ("[STRING:null], ");
336 case MONO_TYPE_OBJECT: {
337 MonoObject *o = (MonoObject *)eax;
/* For boxed primitives the payload is read right after the MonoObject
 * header. */
340 if (o->vtable->klass == mono_defaults.boolean_class) {
341 printf ("[BOOLEAN:%p:%d]", o, *((guint8 *)o + sizeof (MonoObject)));
342 } else if (o->vtable->klass == mono_defaults.int32_class) {
343 printf ("[INT32:%p:%d]", o, *((gint32 *)((char *)o + sizeof (MonoObject))));
344 } else if (o->vtable->klass == mono_defaults.int64_class) {
345 printf ("[INT64:%p:%lld]", o, *((gint64 *)((char *)o + sizeof (MonoObject))));
347 printf ("[%s.%s:%p]", o->vtable->klass->name_space, o->vtable->klass->name, o);
349 printf ("[OBJECT:%p]", o);
353 case MONO_TYPE_CLASS:
355 case MONO_TYPE_FNPTR:
356 case MONO_TYPE_ARRAY:
357 case MONO_TYPE_SZARRAY:
358 printf ("EAX=%p", (gpointer)eax);
/* Assemble a 64-bit value: eax goes into the first 32-bit half of `l`, edx
 * into the second. */
361 *((gint32 *)&l) = eax;
362 *((gint32 *)&l + 1) = edx;
363 printf ("EAX/EDX=%lld", l);
366 printf ("FP=%f\n", test);
369 printf ("(unknown return type)");
376 * arch_emit_prologue:
377 * @cfg: pointer to status information
379 * Emits the function prolog.
/* Emits the method prologue into cfg->code: frame setup, optional LMF
 * record, saving of used registers, stack allocation for locals, optional
 * trace/profile calls and zero-initialisation of locals.  Many lines are
 * elided in this excerpt, so the comments below describe only what is
 * visible. */
382 arch_emit_prologue (MonoFlowGraph *cfg)
384 MonoMethod *method = cfg->method;
385 MonoMethodHeader *header = ((MonoMethodNormal *)method)->header;
386 int i, j, k, alloc_size, pos;
/* Frame setup: push EBP, then a 4-byte EBP/ESP register move. */
388 x86_push_reg (cfg->code, X86_EBP);
389 x86_mov_reg_reg (cfg->code, X86_EBP, X86_ESP, 4);
391 alloc_size = cfg->locals_size;
394 if (method->save_lmf) {
396 pos += sizeof (MonoLMF);
398 /* save the current IP */
/* Remember where the immediate of the following push sits (code + 1) so
 * mono_compute_branches () can patch in the real address later. */
399 cfg->lmfip_offset = cfg->code + 1 - cfg->start;
400 x86_push_imm (cfg->code, 0);
401 /* save the caller's EBX, EDI, ESI and EBP */
402 x86_push_reg (cfg->code, X86_EBX);
403 x86_push_reg (cfg->code, X86_EDI);
404 x86_push_reg (cfg->code, X86_ESI);
405 x86_push_reg (cfg->code, X86_EBP);
407 /* save method info */
408 x86_push_imm (cfg->code, method);
410 /* get the address of lmf for the current thread */
/* The call target is emitted as 0 and recorded as an absolute jump-info
 * entry pointing at mono_get_lmf_addr. */
411 mono_add_jump_info (cfg, cfg->code, MONO_JUMP_INFO_ABS, mono_get_lmf_addr);
412 x86_call_code (cfg->code, 0);
415 x86_push_reg (cfg->code, X86_EAX);
416 /* push *lmf (previous_lmf) */
417 x86_push_membase (cfg->code, X86_EAX, 0);
/* 4-byte move between [EAX + 0] and ESP; presumably stores ESP there so the
 * LMF slot points at the record just pushed - confirm operand order. */
419 x86_mov_membase_reg (cfg->code, X86_EAX, 0, X86_ESP, 4);
423 /* activation frame alignment check */
/* EAX = ESP & (MONO_FRAME_ALIGNMENT - 1); a non-zero result falls into the
 * breakpoint.  The branch displacement of 1 presumably skips the one-byte
 * breakpoint instruction. */
424 x86_mov_reg_reg (cfg->code, X86_EAX, X86_ESP, 4);
425 x86_alu_reg_imm (cfg->code, X86_AND, X86_EAX, MONO_FRAME_ALIGNMENT - 1);
426 x86_alu_reg_imm (cfg->code, X86_CMP, X86_EAX, 0);
427 x86_branch32 (cfg->code, X86_CC_EQ, 1, FALSE);
428 x86_breakpoint (cfg->code);
/* Save EBX/EDI/ESI only when the register set reports them as used. */
432 if (mono_regset_reg_used (cfg->rs, X86_EBX)) {
433 x86_push_reg (cfg->code, X86_EBX);
437 if (mono_regset_reg_used (cfg->rs, X86_EDI)) {
438 x86_push_reg (cfg->code, X86_EDI);
442 if (mono_regset_reg_used (cfg->rs, X86_ESI)) {
443 x86_push_reg (cfg->code, X86_ESI);
/* Reserve alloc_size bytes of stack. */
450 x86_alu_reg_imm (cfg->code, X86_SUB, X86_ESP, alloc_size);
/* Tracing: call enter_method (method, ebp); the 8 added back to ESP removes
 * the two pushed arguments. */
452 if (mono_jit_trace_calls) {
453 x86_push_reg (cfg->code, X86_EBP);
454 x86_push_imm (cfg->code, cfg->method);
455 x86_mov_reg_imm (cfg->code, X86_EAX, enter_method);
456 x86_call_reg (cfg->code, X86_EAX);
457 x86_alu_reg_imm (cfg->code, X86_ADD, X86_ESP, 8);
/* Profiling: call mono_profiler_method_enter (method). */
459 if (mono_jit_profile) {
460 x86_push_imm (cfg->code, cfg->method);
461 x86_mov_reg_imm (cfg->code, X86_EAX, mono_profiler_method_enter);
462 x86_call_reg (cfg->code, X86_EAX);
463 x86_alu_reg_imm (cfg->code, X86_ADD, X86_ESP, 4);
466 /* initialize local vars */
467 if (header->num_locals) {
468 gboolean unassigned_locals = TRUE;
/* When liveness data for block 0 exists, refine unassigned_locals from its
 * live-in set. */
470 if (cfg->bblocks [0].live_in_set) {
471 i = mono_bitset_find_first (cfg->bblocks [0].live_in_set,
472 cfg->locals_start_index - 1);
473 unassigned_locals = (i >= 0 && i < cfg->locals_start_index +
477 if (unassigned_locals && header->init_locals) {
/* Start from the offset of the last local variable. */
478 MonoVarInfo *vi = &VARINFO (cfg, cfg->locals_start_index + header->num_locals - 1);
479 int offset = vi->offset;
483 /* do not clear caller saved registers */
486 for (i = 0; i < header->num_locals; ++i) {
487 MonoVarInfo *rv = &VARINFO (cfg, cfg->locals_start_index + i);
490 int ind = 1 << rv->reg;
/* Zero a register-allocated local with XOR reg, reg. */
492 x86_alu_reg_reg (cfg->code, X86_XOR, rv->reg, rv->reg);
/* Sizes 1, 2 and 4 are cleared with a single immediate store. */
497 if (size == 1 || size == 2 || size == 4) {
498 x86_mov_membase_imm (cfg->code, X86_EBP, offset, 0, size);
/* Unrolled clearing: 4-byte stores followed by 2- and 1-byte stores
 * (loop bounds and guards are partly elided). */
506 for (k = 0; k < i; k++) {
507 x86_mov_membase_imm (cfg->code, X86_EBP, offset, 0, 4);
512 x86_mov_membase_imm (cfg->code, X86_EBP, offset, 0, 2);
516 x86_mov_membase_imm (cfg->code, X86_EBP, offset, 0, 1);
/* Block clearing via REP STOSL plus trailing STOSB.  EDI is pushed/popped
 * around the sequence only when the register set does not already mark it
 * as used. */
521 if (!mono_regset_reg_used (cfg->rs, X86_EDI))
522 x86_push_reg (cfg->code, X86_EDI);
523 x86_lea_membase (cfg->code, X86_EDI, X86_EBP, offset);
524 x86_alu_reg_reg (cfg->code, X86_XOR, X86_EAX, X86_EAX);
525 x86_mov_reg_imm (cfg->code, X86_ECX, i);
527 x86_prefix (cfg->code, X86_REP_PREFIX);
528 x86_stosl (cfg->code);
529 for (i = 0; i < j; i++)
530 x86_stosb (cfg->code);
531 if (!mono_regset_reg_used (cfg->rs, X86_EDI))
532 x86_pop_reg (cfg->code, X86_EDI);
/* Three bytes: a 2-byte store followed by a 1-byte store at offset + 2. */
536 x86_mov_membase_imm (cfg->code, X86_EBP, offset, 0, 2);
537 x86_mov_membase_imm (cfg->code, X86_EBP, offset + 2, 0, 1);
542 /* we always need to initialize object pointers */
544 for (i = 0; i < header->num_locals; ++i) {
545 MonoType *t = header->locals [i];
546 int offset = VARINFO (cfg, cfg->locals_start_index + i).offset;
549 x86_mov_membase_imm (cfg->code, X86_EBP, offset, 0, 4);
/* Reference-like types get a 4-byte zero store. */
554 case MONO_TYPE_STRING:
555 case MONO_TYPE_CLASS:
556 case MONO_TYPE_ARRAY:
557 case MONO_TYPE_SZARRAY:
558 case MONO_TYPE_OBJECT:
559 x86_mov_membase_imm (cfg->code, X86_EBP, offset, 0, 4);
569 * arch_emit_epilogue:
570 * @cfg: pointer to status information
572 * Emits the function epilog.
/* Emits the method epilogue into cfg->code: optional trace/profile calls
 * that preserve EAX/EDX, restoring of saved registers, LMF unlinking and
 * the final LEAVE.  Several lines are elided in this excerpt. */
575 arch_emit_epilogue (MonoFlowGraph *cfg)
579 * note: with trace and profiling the value on the FP stack may get clobbered.
/* Tracing: build the argument list of leave_method (method, edx, eax, test)
 * on the stack - an 8-byte FP slot, then EAX, EDX and the method pointer.
 * After the call the method argument is dropped, EDX/EAX are popped back
 * and the 8-byte slot is released. */
581 if (mono_jit_trace_calls) {
582 x86_fld_reg (cfg->code, 0);
583 x86_alu_reg_imm (cfg->code, X86_SUB, X86_ESP, 8);
584 x86_fst_membase (cfg->code, X86_ESP, 0, TRUE, TRUE);
585 x86_push_reg (cfg->code, X86_EAX);
586 x86_push_reg (cfg->code, X86_EDX);
587 x86_push_imm (cfg->code, cfg->method);
588 x86_mov_reg_imm (cfg->code, X86_EAX, leave_method);
589 x86_call_reg (cfg->code, X86_EAX);
590 x86_alu_reg_imm (cfg->code, X86_ADD, X86_ESP, 4);
591 x86_pop_reg (cfg->code, X86_EDX);
592 x86_pop_reg (cfg->code, X86_EAX);
593 x86_alu_reg_imm (cfg->code, X86_ADD, X86_ESP, 8);
/* Profiling: EAX/EDX are saved around the mono_profiler_method_leave ()
 * call. */
595 if (mono_jit_profile) {
596 x86_push_reg (cfg->code, X86_EAX);
597 x86_push_reg (cfg->code, X86_EDX);
598 x86_push_imm (cfg->code, cfg->method);
599 x86_mov_reg_imm (cfg->code, X86_EAX, mono_profiler_method_leave);
600 x86_call_reg (cfg->code, X86_EAX);
601 x86_alu_reg_imm (cfg->code, X86_ADD, X86_ESP, 4);
602 x86_pop_reg (cfg->code, X86_EDX);
603 x86_pop_reg (cfg->code, X86_EAX);
/* With an LMF record present, the saved registers sit below it. */
606 if (cfg->method->save_lmf) {
607 pos = -sizeof (MonoLMF) - 4;
/* Reload EBX/EDI/ESI from EBP-relative slots when they were used; the
 * updates of `pos` between the loads are elided. */
611 if (mono_regset_reg_used (cfg->rs, X86_EBX)) {
612 x86_mov_reg_membase (cfg->code, X86_EBX, X86_EBP, pos, 4);
615 if (mono_regset_reg_used (cfg->rs, X86_EDI)) {
616 x86_mov_reg_membase (cfg->code, X86_EDI, X86_EBP, pos, 4);
619 if (mono_regset_reg_used (cfg->rs, X86_ESI)) {
620 x86_mov_reg_membase (cfg->code, X86_ESI, X86_EBP, pos, 4);
/* Unlink the LMF: point ESP at the record, then pop its fields in the
 * reverse of the order the prologue pushed them. */
624 if (cfg->method->save_lmf) {
625 pos = -sizeof (MonoLMF);
627 x86_lea_membase (cfg->code, X86_ESP, X86_EBP, pos);
629 /* ebx = previous_lmf */
630 x86_pop_reg (cfg->code, X86_EBX);
632 x86_pop_reg (cfg->code, X86_EDI);
633 /* *(lmf) = previous_lmf */
634 x86_mov_membase_reg (cfg->code, X86_EDI, 0, X86_EBX, 4);
636 /* discard method info */
637 x86_pop_reg (cfg->code, X86_ESI);
639 /* restore the caller's EBP, ESI, EDI and EBX */
640 x86_pop_reg (cfg->code, X86_EBP);
641 x86_pop_reg (cfg->code, X86_ESI);
642 x86_pop_reg (cfg->code, X86_EDI);
643 x86_pop_reg (cfg->code, X86_EBX);
647 x86_leave (cfg->code);
/* Resets the live-range fields of `vi` and assigns it the next variable
 * number, i.e. the current length of cfg->varinfo. */
652 init_varinfo (MonoFlowGraph *cfg, MonoVarInfo *vi)
654 vi->range.last_use.abs_pos = 0;
/* 0xffff in the block id is presumably a "not used yet" sentinel. */
655 vi->range.first_use.pos.bid = 0xffff;
656 vi->range.first_use.pos.tid = 0;
659 vi->varnum = cfg->varinfo->len;
/* Registers an argument variable described by `info` (offset and size) in
 * cfg->varinfo and returns its index in that array. */
663 arch_allocate_arg (MonoFlowGraph *cfg, MonoJitArgumentInfo *info, MonoValueType type)
667 mono_jit_stats.allocate_var++;
669 init_varinfo (cfg, &vi);
672 SET_VARINFO (vi, type, MONO_ARGVAR, info->offset, info->size);
673 g_array_append_val (cfg->varinfo, vi);
/* The new element is the last one in the array. */
675 return cfg->varinfo->len - 1;
/* Reserves `size` bytes, aligned to `align`, in the locals area, registers
 * the variable in cfg->varinfo and returns its index. */
679 arch_allocate_var (MonoFlowGraph *cfg, int size, int align, MonoVarType vartype, MonoValueType type)
683 mono_jit_stats.allocate_var++;
685 init_varinfo (cfg, &vi);
/* Non-pointer-sized variables get special treatment; the statement guarded
 * by this test is elided in this excerpt. */
687 if (size != sizeof (gpointer))
/* Grow the locals area by size, then round it up to a multiple of align
 * (align must be a power of two for the mask to work). */
690 cfg->locals_size += size;
691 cfg->locals_size += align - 1;
692 cfg->locals_size &= ~(align - 1);
/* The variable's offset is the negated locals size. */
694 SET_VARINFO (vi, type, vartype, - cfg->locals_size, size);
695 g_array_append_val (cfg->varinfo, vi);
697 return cfg->varinfo->len - 1;
/* Runs the BURG labeller (mono_burg_label) over every tree of every reached
 * basic block.  arch_jit_compile_cfg () treats a zero return as failure. */
701 mono_label_cfg (MonoFlowGraph *cfg)
705 for (i = 0; i < cfg->block_count; i++) {
706 GPtrArray *forest = cfg->bblocks [i].forest;
709 if (!cfg->bblocks [i].reached) /* unreachable code */
714 for (j = 0; j < top; j++) {
715 MBTree *t1 = (MBTree *) g_ptr_array_index (forest, j);
718 mbstate = mono_burg_label (t1, cfg);
/* Failure path (its guard is elided): warn with the method name and CLI
 * address, dump the tree and the forest, then abort. */
721 if (mono_debug_format != MONO_DEBUG_FORMAT_NONE)
723 g_warning ("tree does not match in %s: 0x%04x",
724 mono_method_full_name (cfg->method, TRUE), t1->cli_addr);
725 mono_print_ctree (cfg, t1); printf ("\n\n");
727 mono_print_forest (cfg, forest);
728 g_assert_not_reached ();
/* Recursively assigns registers (reg1/reg2/reg3) to `tree` and its kids for
 * the BURG rule selected by `goal`, using register set `rs` and avoiding
 * the registers in `exclude_mask`.  Callers treat a zero return as failure.
 * When the second kid cannot be allocated, the first kid's registers are
 * freed, the kid is marked spilled and the allocation is retried.  Many
 * lines (switch heads, returns, spillcount updates) are elided here. */
737 tree_allocate_regs (MonoFlowGraph *cfg, MBTree *tree, int goal, MonoRegSet *rs,
738 guint8 exclude_mask, int *spillcount)
741 int ern = mono_burg_rule (tree->state, goal);
742 const guint16 *nts = mono_burg_nts [ern];
743 guint8 left_exclude_mask = 0, right_exclude_mask = 0;
/* NOTE(review): this debug printf reads kids [0] before the
 * mono_burg_kids () call below fills the array - confirm it is initialised
 * in an elided line. */
746 #ifdef DEBUG_REGALLOC
747 printf ("tree_allocate_regs start %d %08x %d %d\n", tree->op, rs->free_mask, goal,
748 (nts [0] && kids [0] == tree));
751 mono_burg_kids (tree, ern, kids);
/* Per-opcode constraints (the case labels are partly elided): keep ECX out
 * of this node and of its left subtree. */
757 exclude_mask |= (1 << X86_ECX);
758 left_exclude_mask |= (1 << X86_ECX);
761 case MB_TERM_MUL_OVF:
762 case MB_TERM_MUL_OVF_UN:
/* For a `reg` result: keep EDX out of the left subtree and EDX/EAX out of
 * the right one. */
767 if (goal == MB_NTERM_reg) {
768 left_exclude_mask |= (1 << X86_EDX);
769 right_exclude_mask |= (1 << X86_EDX) | (1 << X86_EAX);
/* Chain rule: the single "kid" is the tree itself, so recurse with the
 * same exclude mask. */
776 if (nts [0] && kids [0] == tree) {
778 if (!tree_allocate_regs (cfg, kids [0], nts [0], rs, exclude_mask, spillcount))
799 if (nts [1]) { /* two kids */
802 if (!tree_allocate_regs (cfg, kids [0], nts [0], rs, left_exclude_mask, spillcount))
807 if (!tree_allocate_regs (cfg, kids [1], nts [1], rs, right_exclude_mask, spillcount)) {
809 #ifdef DEBUG_REGALLOC
810 printf ("tree_allocate_regs try 1 failed %d %d %d %d\n",
811 nts [1], kids [1]->reg1,
812 kids [1]->reg2,kids [1]->reg3);
/* Second attempt: forbid the left kid's registers for the right subtree,
 * release them and mark the left kid as spilled. */
816 if (kids [0]->reg1 != -1) {
817 right_exclude_mask |= 1 << kids [0]->reg1;
820 if (kids [0]->reg2 != -1) {
821 right_exclude_mask |= 1 << kids [0]->reg2;
824 if (kids [0]->reg3 != -1) {
825 right_exclude_mask |= 1 << kids [0]->reg3;
/* NOTE(review): these are freed without the -1 check used just above;
 * presumably mono_regset_free_reg () tolerates -1 - confirm. */
829 mono_regset_free_reg (rs, kids [0]->reg1);
830 mono_regset_free_reg (rs, kids [0]->reg2);
831 mono_regset_free_reg (rs, kids [0]->reg3);
833 kids [0]->spilled = 1;
835 if (!tree_allocate_regs (cfg, kids [1], nts [1], rs, right_exclude_mask, spillcount)) {
836 #ifdef DEBUG_REGALLOC
837 printf ("tree_allocate_regs try 2 failed\n");
841 #ifdef DEBUG_REGALLOC
842 printf ("tree_allocate_regs try 2 succesfull\n");
847 if (nts [3]) /* we can't handle four kids */
848 g_assert_not_reached ();
850 if (!tree_allocate_regs (cfg, kids [2], nts [2], rs, right_exclude_mask, spillcount))
855 } else { /* one kid */
856 if (!tree_allocate_regs (cfg, kids [0], nts [0], rs, left_exclude_mask, spillcount))
/* The kids' registers are released before this node picks its own. */
862 for (i = 0; nts [i]; i++) {
863 mono_regset_free_reg (rs, kids [i]->reg1);
864 mono_regset_free_reg (rs, kids [i]->reg2);
865 mono_regset_free_reg (rs, kids [i]->reg3);
868 tree->emit = mono_burg_func [ern];
/* Calls claim EAX, EDX and ECX. */
871 case MB_TERM_CALL_I4:
872 case MB_TERM_CALL_I8:
873 case MB_TERM_CALL_R8:
874 // case MB_TERM_CALL_VOID :
875 if ((tree->reg1 = mono_regset_alloc_reg (rs, X86_EAX, exclude_mask)) == -1)
877 if ((tree->reg2 = mono_regset_alloc_reg (rs, X86_EDX, exclude_mask)) == -1)
879 if ((tree->reg3 = mono_regset_alloc_reg (rs, X86_ECX, exclude_mask)) == -1)
/* These opcodes need the fixed EAX/EDX pair; otherwise any free register
 * (-1) is requested. */
887 case MB_TERM_MUL_OVF_UN:
892 if ((tree->reg1 = mono_regset_alloc_reg (rs, X86_EAX, exclude_mask)) == -1)
894 if ((tree->reg2 = mono_regset_alloc_reg (rs, X86_EDX, exclude_mask)) == -1)
898 if ((tree->reg1 = mono_regset_alloc_reg (rs, -1, exclude_mask)) == -1)
906 case MB_TERM_MUL_OVF:
907 case MB_TERM_MUL_OVF_UN:
912 if ((tree->reg1 = mono_regset_alloc_reg (rs, X86_EAX, exclude_mask)) == -1)
914 if ((tree->reg2 = mono_regset_alloc_reg (rs, X86_EDX, exclude_mask)) == -1)
918 if ((tree->reg1 = mono_regset_alloc_reg (rs, -1, exclude_mask)) == -1)
920 if ((tree->reg2 = mono_regset_alloc_reg (rs, -1, exclude_mask)) == -1)
926 /* fixme: allocate floating point registers */
/* Request the register a child already used. */
930 if (tree->op == MB_TERM_ADD) {
931 if ((tree->reg1 = mono_regset_alloc_reg (rs, tree->left->reg1, exclude_mask)) == -1)
933 if ((tree->reg2 = mono_regset_alloc_reg (rs, tree->right->reg1, exclude_mask)) == -1)
939 if (tree->op == MB_TERM_ADD) {
940 if ((tree->reg1 = mono_regset_alloc_reg (rs, tree->left->reg1, exclude_mask)) == -1)
946 if (tree->op == MB_TERM_SHL ||
947 tree->op == MB_TERM_MUL) {
948 if ((tree->reg1 = mono_regset_alloc_reg (rs, tree->left->reg1, exclude_mask)) == -1)
958 #ifdef DEBUG_REGALLOC
959 printf ("tree_allocate_regs end %d %08x\n", tree->op, rs->free_mask);
/* Runs tree_allocate_regs () on every tree of every reached basic block,
 * tracks the largest spill count seen, and finally allocates one
 * pointer-sized stack slot per spill. */
965 arch_allocate_regs (MonoFlowGraph *cfg)
967 int i, j, max_spillcount = 0;
969 for (i = 0; i < cfg->block_count; i++) {
970 GPtrArray *forest = cfg->bblocks [i].forest;
973 if (!cfg->bblocks [i].reached) /* unreachable code */
978 for (j = 0; j < top; j++) {
979 MBTree *t1 = (MBTree *) g_ptr_array_index (forest, j);
981 #ifdef DEBUG_REGALLOC
982 printf ("arch_allocate_regs start %d:%d %08x\n", i, j, cfg->rs->free_mask);
/* Goal nonterminal 1; a failed allocation is fatal. */
984 if (!tree_allocate_regs (cfg, t1, 1, cfg->rs, 0, &spillcount)) {
985 mono_print_ctree (cfg, t1);
987 g_error ("register allocation failed");
990 max_spillcount = MAX (max_spillcount, spillcount);
992 #ifdef DEBUG_REGALLOC
993 printf ("arch_allocate_regs end %d:%d %08x\n", i, j, cfg->rs->free_mask);
/* Every register must be free again once a tree has been processed. */
995 g_assert (cfg->rs->free_mask == 0xffffffff);
999 /* allocate space for spilled regs */
1001 cfg->spillvars = mono_mempool_alloc0 (cfg->mp, sizeof (gint) * max_spillcount);
1002 cfg->spillcount = max_spillcount;
/* cfg->spillvars [i] holds the frame offset of the i-th spill slot. */
1004 for (i = 0; i < max_spillcount; i++) {
1006 spillvar = arch_allocate_var (cfg, sizeof (gpointer), sizeof (gpointer),
1007 MONO_TEMPVAR, VAL_I32);
1008 cfg->spillvars [i] = VARINFO (cfg, spillvar).offset;
/* Recursively emits code for `tree`: kids first (spilling and reloading the
 * first kid's registers around the second kid when it was marked spilled),
 * then the tree's own emit function.  The code buffer is grown when little
 * room remains.  Several lines are elided in this excerpt. */
1013 tree_emit (int goal, MonoFlowGraph *cfg, MBTree *tree, int *spillcount)
1016 int ern = mono_burg_rule (tree->state, goal);
1017 const guint16 *nts = mono_burg_nts [ern];
1021 mono_burg_kids (tree, ern, kids);
1025 int spilloffset1, spilloffset2, spilloffset3;
1027 tree_emit (nts [0], cfg, kids [0], spillcount);
1029 if (kids [0]->spilled) {
1031 printf ("SPILL_REGS %d %03x %s.%s:%s\n",
1032 nts [0], cfg->code - cfg->start,
1033 cfg->method->klass->name_space,
1034 cfg->method->klass->name, cfg->method->name);
1036 mono_print_ctree (cfg, kids [0]);printf ("\n\n");
/* Each live register of the first kid takes the next spill slot and is
 * stored at that EBP-relative offset. */
1042 if (kids [0]->reg1 != -1) {
1043 spilloffset1 = cfg->spillvars [(*spillcount)++];
1044 x86_mov_membase_reg (cfg->code, X86_EBP, spilloffset1,
1047 if (kids [0]->reg2 != -1) {
1048 spilloffset2 = cfg->spillvars [(*spillcount)++];
1049 x86_mov_membase_reg (cfg->code, X86_EBP, spilloffset2,
1052 if (kids [0]->reg3 != -1) {
1053 spilloffset3 = cfg->spillvars [(*spillcount)++];
1054 x86_mov_membase_reg (cfg->code, X86_EBP, spilloffset3,
1059 tree_emit (nts [1], cfg, kids [1], spillcount);
1061 if (kids [0]->spilled) {
1064 printf ("RELOAD_REGS %03x %s.%s:%s\n",
1065 cfg->code - cfg->start,
1066 cfg->method->klass->name_space,
1067 cfg->method->klass->name, cfg->method->name);
/* Reload in the order reg3, reg2, reg1. */
1070 if (kids [0]->reg3 != -1)
1071 x86_mov_reg_membase (cfg->code, kids [0]->reg3, X86_EBP,
1073 if (kids [0]->reg2 != -1)
1074 x86_mov_reg_membase (cfg->code, kids [0]->reg2, X86_EBP,
1076 if (kids [0]->reg1 != -1)
1077 x86_mov_reg_membase (cfg->code, kids [0]->reg1, X86_EBP,
/* At most three kids are supported. */
1082 g_assert (!nts [3]);
1083 tree_emit (nts [2], cfg, kids [2], spillcount);
1086 tree_emit (nts [0], cfg, kids [0], spillcount);
/* Never use more spill slots than arch_allocate_regs () reserved. */
1090 g_assert ((*spillcount) <= cfg->spillcount);
/* Record the tree's code offset. */
1092 tree->addr = offset = cfg->code - cfg->start;
1094 /* we assume an instruction uses a maximum of 128 bytes */
/* Grow the buffer by MIN (code_size, 128) bytes when 128 or fewer remain,
 * then rebase cfg->code onto the possibly moved buffer. */
1095 if ((cfg->code_size - offset) <= 128) {
1096 int add = MIN (cfg->code_size, 128);
1097 cfg->code_size += add;
1098 mono_jit_stats.code_reallocs++;
1099 cfg->start = g_realloc (cfg->start, cfg->code_size);
1100 g_assert (cfg->start);
1101 cfg->code = cfg->start + offset;
/* Look up the emit function for this rule; it may be NULL. */
1104 if ((emit = mono_burg_func [ern]))
/* Sanity check: the write position is still inside the buffer. */
1107 g_assert ((cfg->code - cfg->start) < cfg->code_size);
/* Emits code for every tree of every reached basic block, recording each
 * block's start offset in bb->addr and the offset following the last block
 * in cfg->epilog. */
1111 mono_emit_cfg (MonoFlowGraph *cfg)
1113 int i, j, spillcount;
1115 for (i = 0; i < cfg->block_count; i++) {
1116 MonoBBlock *bb = &cfg->bblocks [i];
1117 GPtrArray *forest = bb->forest;
1120 if (!bb->reached) /* unreachable code */
/* Block address = offset of the current write position from cfg->start. */
1125 bb->addr = cfg->code - cfg->start;
1127 for (j = 0; j < top; j++) {
1128 MBTree *t1 = (MBTree *) g_ptr_array_index (forest, j);
/* Goal nonterminal 1; spillcount is presumably reset in an elided line
 * before this call - confirm. */
1131 tree_emit (1, cfg, t1, &spillcount);
1135 cfg->epilog = cfg->code - cfg->start;
/* Fix-up pass run once the code sits at its final address: rewrites switch
 * jump tables with absolute addresses, patches every recorded jump-info
 * entry and fills in the IP slot of the LMF-saving code. */
1139 mono_compute_branches (MonoFlowGraph *cfg)
1147 for (j = 0; j < cfg->block_count; j++) {
1148 MonoBBlock *bb = &cfg->bblocks [j];
1149 GPtrArray *forest = bb->forest;
1152 if (!bb->reached) /* unreachable code */
1157 for (i = 0; i < top; i++) {
1158 MBTree *t1 = (MBTree *) g_ptr_array_index (forest, i);
/* Switch data is one buffer viewed two ways: element 0 is a count, the
 * following m (= count + 1) elements are MonoBBlock pointers that get
 * overwritten in place with absolute code addresses.  The (int) cast
 * assumes pointers fit in an int. */
1160 if (t1->op == MB_TERM_SWITCH) {
1161 MonoBBlock **jt = (MonoBBlock **)t1->data.p;
1162 guint32 *rt = (guint32 *)t1->data.p;
1163 int m = *((guint32 *)t1->data.p) + 1;
1166 for (k = 1; k <= m; k++)
1167 rt [k] = (int)(jt [k]->addr + cfg->start);
1169 /* emit the switch instruction again to update addresses */
1170 cfg->code = cfg->start + t1->addr;
1171 ((MBEmitFunc)t1->emit) (t1, cfg);
/* ji->ip holds an offset from cfg->start (see mono_add_jump_info ()); turn
 * it back into an absolute address. */
1178 for (ji = cfg->jump_info; ji; ji = ji->next) {
1179 unsigned char *ip = GUINT_TO_POINTER (GPOINTER_TO_UINT (ji->ip) + cfg->start);
1180 unsigned char *target;
1183 case MONO_JUMP_INFO_BB:
1184 target = ji->data.bb->addr + cfg->start;
1186 case MONO_JUMP_INFO_ABS:
1187 target = ji->data.target;
1189 case MONO_JUMP_INFO_EPILOG:
1190 target = cfg->epilog + cfg->start;
/* IP entries store the location's own address at that location. */
1192 case MONO_JUMP_INFO_IP:
1193 *(unsigned char**)ip = ip;
1196 g_assert_not_reached ();
1198 x86_patch (ip, target);
1201 /* patch the IP in the LMF saving code */
/* lmfip_offset was recorded by arch_emit_prologue (); write the absolute
 * address of that slot into the slot itself. */
1202 if (cfg->lmfip_offset) {
1203 *((guint32 *)(cfg->start + cfg->lmfip_offset)) =
1204 (gint32)(cfg->start + cfg->lmfip_offset);
/* Records a patch site: allocates a MonoJumpInfo from cfg->mp, fills it in
 * and pushes it onto the head of the cfg->jump_info list. */
1209 mono_add_jump_info (MonoFlowGraph *cfg, gpointer ip, MonoJumpInfoType type, gpointer target)
1211 MonoJumpInfo *ji = mono_mempool_alloc (cfg->mp, sizeof (MonoJumpInfo));
/* Store ip as an offset from cfg->start. */
1214 ji->ip = GUINT_TO_POINTER (GPOINTER_TO_UINT (ip) - GPOINTER_TO_UINT (cfg->start));
1215 ji->data.target = target;
1216 ji->next = cfg->jump_info;
1218 cfg->jump_info = ji;
/* Drives native code generation for one method: register-set setup,
 * optional linear scan, tree labelling, register allocation, prologue /
 * body / epilogue emission, relocation of the code to its final buffer,
 * branch fix-up and filling in of the MonoJitInfo.  The end of the function
 * is not visible in this excerpt. */
1222 arch_jit_compile_cfg (MonoDomain *target_domain, MonoFlowGraph *cfg)
1225 guint32 ls_used_mask = 0;
1226 MonoMethod *method = cfg->method;
/* The MonoJitInfo is zero-allocated from the target domain's mempool. */
1229 ji = mono_mempool_alloc0 (target_domain->mp, sizeof (MonoJitInfo));
/* ESP and EBP are reserved in the register set. */
1231 cfg->rs = mono_regset_new (X86_NREG);
1232 mono_regset_reserve_reg (cfg->rs, X86_ESP);
1233 mono_regset_reserve_reg (cfg->rs, X86_EBP);
1235 /* we can use these regs for global register allocation */
1236 mono_regset_reserve_reg (cfg->rs, X86_EBX);
1237 mono_regset_reserve_reg (cfg->rs, X86_ESI);
/* Registers picked by the linear scan are merged into the used mask. */
1239 if (mono_use_linear_scan) {
1240 mono_linear_scan (cfg, &ls_used_mask);
1241 cfg->rs->used_mask |= ls_used_mask;
1244 if (mono_jit_dump_forest) {
1246 printf ("FOREST %s\n", mono_method_full_name (method, TRUE));
1247 for (i = 0; i < cfg->block_count; i++) {
1248 printf ("BLOCK %d:\n", i);
1249 mono_print_forest (cfg, cfg->bblocks [i].forest);
/* Labelling failure takes an early exit (the statement is elided). */
1253 if (!mono_label_cfg (cfg))
1256 arch_allocate_regs (cfg);
1258 /* align to 8 byte boundary */
1259 cfg->locals_size += 7;
1260 cfg->locals_size &= ~7;
/* Emit prologue, body and epilogue, recording where prologue and epilogue
 * end as offsets from cfg->start. */
1262 arch_emit_prologue (cfg);
1263 cfg->prologue_end = cfg->code - cfg->start;
1264 mono_emit_cfg (cfg);
1265 arch_emit_epilogue (cfg);
1266 cfg->epilogue_end = cfg->code - cfg->start;
/* offset = bytes emitted; gap = unused tail of the buffer. */
1268 offset = cfg->code - cfg->start;
1269 gap = cfg->code_size - offset;
/* Two ways of trimming the code to its final size are visible: shrinking
 * in place with g_realloc, or copying into the domain's code mempool.  The
 * condition choosing between them is elided. */
1271 char *org = cfg->start;
1273 cfg->start = g_realloc (cfg->start, offset);
1275 cfg->start = mono_mempool_alloc (target_domain->code_mp, offset);
1276 memcpy (cfg->start, org, offset);
1279 cfg->code_size = offset;
1280 cfg->code = cfg->start + offset;
/* Branch targets are fixed up only now that the code is at its final
 * address. */
1283 mono_compute_branches (cfg);
1285 ji->code_size = cfg->code - cfg->start;
1286 ji->used_regs = cfg->rs->used_mask;
1287 ji->method = method;
1288 ji->code_start = cfg->start;