3 * ARM backend for the Mono code generator
6 * Paolo Molaro (lupus@ximian.com)
7 * Dietmar Maurer (dietmar@ximian.com)
9 * (C) 2003 Ximian, Inc.
10 * Copyright 2003-2011 Novell, Inc (http://www.novell.com)
11 * Copyright 2011 Xamarin, Inc (http://www.xamarin.com)
12 * Licensed under the MIT license. See LICENSE file in the project root for full license information.
17 #include <mono/metadata/abi-details.h>
18 #include <mono/metadata/appdomain.h>
19 #include <mono/metadata/profiler-private.h>
20 #include <mono/metadata/debug-helpers.h>
21 #include <mono/utils/mono-mmap.h>
22 #include <mono/utils/mono-hwcap.h>
23 #include <mono/utils/mono-memory-model.h>
24 #include <mono/utils/mono-threads-coop.h>
30 #include "debugger-agent.h"
32 #include "mono/arch/arm/arm-vfp-codegen.h"
34 /* Sanity check: This makes no sense */
35 #if defined(ARM_FPU_NONE) && (defined(ARM_FPU_VFP) || defined(ARM_FPU_VFP_HARD))
36 #error "ARM_FPU_NONE is defined while one of ARM_FPU_VFP/ARM_FPU_VFP_HARD is defined"
40 * IS_SOFT_FLOAT: Is full software floating point used?
41 * IS_HARD_FLOAT: Is full hardware floating point used?
42 * IS_VFP: Is hardware floating point with software ABI used?
44 * These are not necessarily constants, e.g. IS_SOFT_FLOAT and
45 * IS_VFP may delegate to mono_arch_is_soft_float ().
48 #if defined(ARM_FPU_VFP_HARD)
49 #define IS_SOFT_FLOAT (FALSE)
50 #define IS_HARD_FLOAT (TRUE)
52 #elif defined(ARM_FPU_NONE)
53 #define IS_SOFT_FLOAT (mono_arch_is_soft_float ())
54 #define IS_HARD_FLOAT (FALSE)
55 #define IS_VFP (!mono_arch_is_soft_float ())
57 #define IS_SOFT_FLOAT (FALSE)
58 #define IS_HARD_FLOAT (FALSE)
62 #define THUNK_SIZE (3 * 4)
64 #define ALIGN_TO(val,align) ((((guint64)val) + ((align) - 1)) & ~((align) - 1))
67 void sys_icache_invalidate (void *start, size_t len);
70 /* This mutex protects architecture specific caches */
71 #define mono_mini_arch_lock() mono_os_mutex_lock (&mini_arch_mutex)
72 #define mono_mini_arch_unlock() mono_os_mutex_unlock (&mini_arch_mutex)
73 static mono_mutex_t mini_arch_mutex;
75 static gboolean v5_supported = FALSE;
76 static gboolean v6_supported = FALSE;
77 static gboolean v7_supported = FALSE;
78 static gboolean v7s_supported = FALSE;
79 static gboolean v7k_supported = FALSE;
80 static gboolean thumb_supported = FALSE;
81 static gboolean thumb2_supported = FALSE;
83 * Whether to use the ARM EABI
85 static gboolean eabi_supported = FALSE;
88 * Whether to use the iphone ABI extensions:
89 * http://developer.apple.com/library/ios/documentation/Xcode/Conceptual/iPhoneOSABIReference/index.html
90 * Basically, r7 is used as a frame pointer and it should point to the saved r7 + lr.
91 * This is required for debugging/profiling tools to work, but it has some overhead so it should
92 * only be turned on in debug builds.
94 static gboolean iphone_abi = FALSE;
97 * The FPU we are generating code for. This is NOT runtime configurable right now,
98 * since some things like MONO_ARCH_CALLEE_FREGS still depend on defines.
100 static MonoArmFPU arm_fpu;
102 #if defined(ARM_FPU_VFP_HARD)
104 * On armhf, d0-d7 are used for argument passing and d8-d15
105 * must be preserved across calls, which leaves us no room
106 * for scratch registers. So we use d14-d15 but back up their
107 * previous contents to a stack slot before using them - see
108 * mono_arm_emit_vfp_scratch_save/_restore ().
110 static int vfp_scratch1 = ARM_VFP_D14;
111 static int vfp_scratch2 = ARM_VFP_D15;
114 * On armel, d0-d7 do not need to be preserved, so we can
115 * freely make use of them as scratch registers.
117 static int vfp_scratch1 = ARM_VFP_D0;
118 static int vfp_scratch2 = ARM_VFP_D1;
123 static gpointer single_step_tramp, breakpoint_tramp;
124 static gpointer get_tls_tramp;
127 * The code generated for sequence points reads from this location, which is
128 * made read-only when single stepping is enabled.
130 static gpointer ss_trigger_page;
132 /* Enabled breakpoints read from this trigger page */
133 static gpointer bp_trigger_page;
137 * floating point support: on ARM it is a mess, there are at least 3
138 * different setups, each of which is binary incompatible with the others.
139 * 1) FPA: old and ugly, but unfortunately what current distros use
140 * the double binary format has the two words swapped. 8 double registers.
141 * Implemented usually by kernel emulation.
142 * 2) softfloat: the compiler emulates all the fp ops. Usually uses the
143 * ugly swapped double format (I guess a softfloat-vfp exists, too, though).
144 * 3) VFP: the new and actually sensible and useful FP support. Implemented
145 * in HW or kernel-emulated, requires new tools. I think this is what symbian uses.
147 * We do not care about FPA. We will support soft float and VFP.
149 int mono_exc_esp_offset = 0;
151 #define arm_is_imm12(v) ((v) > -4096 && (v) < 4096)
152 #define arm_is_imm8(v) ((v) > -256 && (v) < 256)
153 #define arm_is_fpimm8(v) ((v) >= -1020 && (v) <= 1020)
155 #define LDR_MASK ((0xf << ARMCOND_SHIFT) | (3 << 26) | (1 << 22) | (1 << 20) | (15 << 12))
156 #define LDR_PC_VAL ((ARMCOND_AL << ARMCOND_SHIFT) | (1 << 26) | (0 << 22) | (1 << 20) | (15 << 12))
157 #define IS_LDR_PC(val) (((val) & LDR_MASK) == LDR_PC_VAL)
159 //#define DEBUG_IMT 0
162 static void mono_arch_compute_omit_fp (MonoCompile *cfg);
166 emit_aotconst (MonoCompile *cfg, guint8 *code, int dreg, int patch_type, gpointer data);
/*
 * mono_arch_regname:
 *
 *   Map an integer register number to a printable name through a static
 * lookup table. The visible bounds check accepts REG in the range [0, 16).
 */
169 mono_arch_regname (int reg)
171 static const char * rnames[] = {
172 "arm_r0", "arm_r1", "arm_r2", "arm_r3", "arm_v1",
173 "arm_v2", "arm_v3", "arm_v4", "arm_v5", "arm_v6",
174 "arm_v7", "arm_fp", "arm_ip", "arm_sp", "arm_lr",
177 if (reg >= 0 && reg < 16)
/*
 * mono_arch_fregname:
 *
 *   Map a floating point register number to a printable name through a static
 * lookup table. The visible bounds check accepts REG in the range [0, 32).
 */
183 mono_arch_fregname (int reg)
185 static const char * rnames[] = {
186 "arm_f0", "arm_f1", "arm_f2", "arm_f3", "arm_f4",
187 "arm_f5", "arm_f6", "arm_f7", "arm_f8", "arm_f9",
188 "arm_f10", "arm_f11", "arm_f12", "arm_f13", "arm_f14",
189 "arm_f15", "arm_f16", "arm_f17", "arm_f18", "arm_f19",
190 "arm_f20", "arm_f21", "arm_f22", "arm_f23", "arm_f24",
191 "arm_f25", "arm_f26", "arm_f27", "arm_f28", "arm_f29",
194 if (reg >= 0 && reg < 32)
/*
 * emit_big_add:
 *
 *   Emit code computing DREG = SREG + IMM. Callers reassign their code
 * pointer from the result.
 * When IMM can be encoded as a rotated 8 bit immediate
 * (mono_arm_is_rotated_imm8 () returns >= 0) a single ADD with immediate is
 * emitted. Otherwise IMM is first materialized with mono_arm_emit_load_imm (),
 * either into IP or into DREG, and a register-register ADD follows.
 * NOTE(review): the condition choosing between the IP and the DREG variant is
 * not visible in this excerpt; presumably IP is used when dreg == sreg, in
 * which case IP is clobbered - confirm.
 */
202 emit_big_add (guint8 *code, int dreg, int sreg, int imm)
204 int imm8, rot_amount;
/* Fast path: IMM fits the rotated 8 bit immediate encoding */
205 if ((imm8 = mono_arm_is_rotated_imm8 (imm, &rot_amount)) >= 0) {
206 ARM_ADD_REG_IMM (code, dreg, sreg, imm8, rot_amount);
/* Variant using IP as the temporary holding IMM */
210 code = mono_arm_emit_load_imm (code, ARMREG_IP, imm);
211 ARM_ADD_REG_REG (code, dreg, sreg, ARMREG_IP);
/* Variant using DREG itself as the temporary holding IMM */
213 code = mono_arm_emit_load_imm (code, dreg, imm);
214 ARM_ADD_REG_REG (code, dreg, dreg, sreg);
219 /* If dreg == sreg, this clobbers IP */
/*
 * emit_sub_imm:
 *
 *   Emit code intended to compute DREG = SREG - IMM. When IMM can be encoded
 * as a rotated 8 bit immediate a single SUB with immediate is emitted.
 * Otherwise IMM is materialized with mono_arm_emit_load_imm (), either into IP
 * or into DREG, followed by a register-register SUB.
 * NOTE(review): the two register-register variants pass their operands in a
 * different order. The IP variant emits SUB (dreg, sreg, IP), i.e. SREG minus
 * the loaded IMM. The DREG variant loads IMM into DREG and then emits
 * SUB (dreg, dreg, sreg). If ARM_SUB_REG_REG (code, rd, rn, rm) encodes
 * rd = rn - rm, that computes IMM - SREG instead of SREG - IMM. Subtraction
 * is not commutative (unlike the ADD in emit_big_add ()), so this looks like
 * an operand order bug - confirm against the macro definition, and consider
 * SUB (dreg, sreg, dreg) or a reverse subtract.
 */
221 emit_sub_imm (guint8 *code, int dreg, int sreg, int imm)
223 int imm8, rot_amount;
/* Fast path: IMM fits the rotated 8 bit immediate encoding */
224 if ((imm8 = mono_arm_is_rotated_imm8 (imm, &rot_amount)) >= 0) {
225 ARM_SUB_REG_IMM (code, dreg, sreg, imm8, rot_amount);
/* Variant using IP as the temporary holding IMM */
229 code = mono_arm_emit_load_imm (code, ARMREG_IP, imm);
230 ARM_SUB_REG_REG (code, dreg, sreg, ARMREG_IP);
/* Variant using DREG as the temporary holding IMM; see the NOTE(review) above */
232 code = mono_arm_emit_load_imm (code, dreg, imm);
233 ARM_SUB_REG_REG (code, dreg, dreg, sreg);
/*
 * emit_memcpy:
 *
 *   Emit code copying SIZE bytes from SREG + SOFFSET to DREG + DOFFSET.
 * Sizes above four pointer words use a word-at-a-time loop with r0 as the
 * source cursor, r1 as the destination cursor, r2 as the remaining byte count
 * and r3 as the data register. Smaller sizes use LDR/STR pairs through LR,
 * either directly off SREG/DREG when all offsets pass arm_is_imm12 (), or off
 * r0/r1 after the base addresses have been computed with emit_big_add ().
 * NOTE(review): the loop subtracts 4 per iteration and only exits when r2
 * reaches exactly zero, so SIZE is presumably always a multiple of 4 - confirm
 * with the callers.
 * NOTE(review): r0 is written before DREG is read for r1, so this presumably
 * assumes that neither SREG nor DREG is one of r0-r3 - confirm.
 */
239 emit_memcpy (guint8 *code, int size, int dreg, int doffset, int sreg, int soffset)
241 /* we can use r0-r3, since this is called only for incoming args on the stack */
242 if (size > sizeof (gpointer) * 4) {
244 code = emit_big_add (code, ARMREG_R0, sreg, soffset);
245 code = emit_big_add (code, ARMREG_R1, dreg, doffset);
/* start_loop is the code pointer obtained after loading the byte count, so the backward branch targets the LDR below */
246 start_loop = code = mono_arm_emit_load_imm (code, ARMREG_R2, size);
247 ARM_LDR_IMM (code, ARMREG_R3, ARMREG_R0, 0);
248 ARM_STR_IMM (code, ARMREG_R3, ARMREG_R1, 0);
249 ARM_ADD_REG_IMM8 (code, ARMREG_R0, ARMREG_R0, 4);
250 ARM_ADD_REG_IMM8 (code, ARMREG_R1, ARMREG_R1, 4);
251 ARM_SUBS_REG_IMM8 (code, ARMREG_R2, ARMREG_R2, 4);
/* Branch emitted with a zero displacement and then patched to jump back to start_loop */
252 ARM_B_COND (code, ARMCOND_NE, 0);
253 arm_patch (code - 4, start_loop);
/* Small copy: every offset touched must be usable as a load/store immediate */
256 if (arm_is_imm12 (doffset) && arm_is_imm12 (doffset + size) &&
257 arm_is_imm12 (soffset) && arm_is_imm12 (soffset + size)) {
259 ARM_LDR_IMM (code, ARMREG_LR, sreg, soffset);
260 ARM_STR_IMM (code, ARMREG_LR, dreg, doffset);
/* Offsets too large: compute the base addresses into r0/r1 and copy from offset 0 */
266 code = emit_big_add (code, ARMREG_R0, sreg, soffset);
267 code = emit_big_add (code, ARMREG_R1, dreg, doffset);
268 doffset = soffset = 0;
270 ARM_LDR_IMM (code, ARMREG_LR, ARMREG_R0, soffset);
271 ARM_STR_IMM (code, ARMREG_LR, ARMREG_R1, doffset);
/* The small copy paths are expected to have consumed the whole size */
277 g_assert (size == 0);
/*
 * emit_call_reg:
 *
 *   Emit an indirect call through REG. Two encodings are visible here: a
 * single BLX, or a manual sequence that copies PC into LR and then moves REG
 * into PC. The conditions selecting between them are not visible in this
 * excerpt.
 */
282 emit_call_reg (guint8 *code, int reg)
285 ARM_BLX_REG (code, reg);
/* Manual call sequence: set up LR from PC, then jump by writing REG to PC */
287 ARM_MOV_REG_REG (code, ARMREG_LR, ARMREG_PC);
291 ARM_MOV_REG_REG (code, ARMREG_PC, reg);
/*
 * emit_call_seq:
 *
 *   Emit a call sequence for CFG. For dynamic methods (cfg->method->dynamic)
 * the target is loaded into IP from a pointer sized slot embedded in the code
 * stream, which is initialized to NULL here (presumably patched later), and
 * the call goes through emit_call_reg ().
 * The function also grows cfg->thunk_area by THUNK_SIZE.
 * NOTE(review): which path performs the thunk_area bump is not visible in
 * this excerpt - confirm before relying on it.
 */
297 emit_call_seq (MonoCompile *cfg, guint8 *code)
299 if (cfg->method->dynamic) {
300 ARM_LDR_IMM (code, ARMREG_IP, ARMREG_PC, 0);
/* Inline slot holding the call target */
302 *(gpointer*)code = NULL;
304 code = emit_call_reg (code, ARMREG_IP);
308 cfg->thunk_area += THUNK_SIZE;
/*
 * mono_arm_patchable_b:
 *
 *   Emit a B instruction with condition COND and a zero displacement.
 * Presumably the displacement is patched later, as the name suggests.
 */
313 mono_arm_patchable_b (guint8 *code, int cond)
315 ARM_B_COND (code, cond, 0);
/*
 * mono_arm_patchable_bl:
 *
 *   Emit a BL instruction with condition COND and a zero displacement.
 * Presumably the displacement is patched later, as the name suggests.
 */
320 mono_arm_patchable_bl (guint8 *code, int cond)
322 ARM_BL_COND (code, cond, 0);
326 #if defined(__ARM_EABI__) && defined(__linux__) && !defined(PLATFORM_ANDROID) && !defined(MONO_CROSS_COMPILE)
327 #define HAVE_AEABI_READ_TP 1
330 #ifdef HAVE_AEABI_READ_TP
331 gpointer __aeabi_read_tp (void);
/*
 * mono_arch_have_fast_tls:
 *
 *   Report whether thread local storage can be accessed with inline code.
 * When HAVE_AEABI_READ_TP is defined, the answer is computed by comparing the
 * thread pointer returned by __aeabi_read_tp () with the value read directly
 * from coprocessor register p15/c13/c0/3. Fast TLS is reported only when the
 * two values are equal and non-NULL. The result is kept in the function-local
 * statics have_fast_tls and inited. The use_fallback_tls debug option is also
 * consulted; its effect is not visible in this excerpt.
 */
335 mono_arch_have_fast_tls (void)
337 #ifdef HAVE_AEABI_READ_TP
338 static gboolean have_fast_tls = FALSE;
339 static gboolean inited = FALSE;
341 if (mini_get_debug_options ()->use_fallback_tls)
345 return have_fast_tls;
/* Read the thread pointer both through the EABI helper and straight from the coprocessor */
350 tp1 = __aeabi_read_tp ();
351 asm volatile("mrc p15, 0, %0, c13, c0, 3" : "=r" (tp2));
353 have_fast_tls = tp1 && tp1 == tp2;
356 return have_fast_tls;
/*
 * emit_tls_get:
 *
 *   Emit code loading the word at TLS_OFFSET from the thread pointer into
 * DREG. The thread pointer is read with MRC p15, 0, dreg, c13, c0, 3, so DREG
 * doubles as the temporary base register. Asserts that v7_supported is set.
 */
363 emit_tls_get (guint8 *code, int dreg, int tls_offset)
365 g_assert (v7_supported);
366 ARM_MRC (code, 15, 0, dreg, 13, 0, 3);
367 ARM_LDR_IMM (code, dreg, dreg, tls_offset);
/*
 * emit_tls_set:
 *
 *   Emit code storing SREG to the word at TLS_OFFSET from the thread pointer.
 * The thread pointer is read into a temporary register which is overwritten:
 * r0, or r1 when SREG itself is r0. Asserts that v7_supported is set.
 */
372 emit_tls_set (guint8 *code, int sreg, int tls_offset)
/* Pick a temporary that does not alias the value being stored */
374 int tp_reg = (sreg != ARMREG_R0) ? ARMREG_R0 : ARMREG_R1;
375 g_assert (v7_supported);
376 ARM_MRC (code, 15, 0, tp_reg, 13, 0, 3);
377 ARM_STR_IMM (code, sreg, tp_reg, tls_offset);
384 * Emit code to push an LMF structure on the LMF stack.
385 * On arm, this is intermixed with the initialization of other fields of the structure.
/*
 * emit_save_lmf:
 *
 *   Emit code linking the MonoLMF located at SP + LMF_OFFSET into the LMF
 * list. Register usage in the emitted code: r0 holds lmf_addr, r1 holds the
 * address of the new MonoLMF and IP is used as scratch.
 * lmf_addr is obtained either inline through emit_tls_get (), when fast TLS
 * is available and the TLS offset of TLS_KEY_LMF_ADDR is known, or by a
 * patched call to mono_tls_get_lmf_addr.
 * The slots covered by the MonoLMF are reported to the GC map as SLOT_NOREF.
 */
388 emit_save_lmf (MonoCompile *cfg, guint8 *code, gint32 lmf_offset)
392 if (mono_arch_have_fast_tls () && mono_tls_get_tls_offset (TLS_KEY_LMF_ADDR) != -1) {
393 code = emit_tls_get (code, ARMREG_R0, mono_tls_get_tls_offset (TLS_KEY_LMF_ADDR));
/* Slow path: call the runtime helper through a patchable call sequence */
395 mono_add_patch_info (cfg, code - cfg->native_code, MONO_PATCH_INFO_INTERNAL_METHOD,
396 (gpointer)"mono_tls_get_lmf_addr");
397 code = emit_call_seq (cfg, code);
399 /* we build the MonoLMF structure on the stack - see mini-arm.h */
400 /* lmf_offset is the offset from the previous stack pointer,
401 * alloc_size is the total stack space allocated, so the offset
402 * of MonoLMF from the current stack ptr is alloc_size - lmf_offset.
403 * The pointer to the struct is put in r1 (new_lmf).
404 * ip is used as scratch
405 * The callee-saved registers are already in the MonoLMF structure
/* NOTE(review): the code below adds lmf_offset to SP directly, which does not match the alloc_size - lmf_offset wording above; the older comment may be stale - confirm */
407 code = emit_big_add (code, ARMREG_R1, ARMREG_SP, lmf_offset);
408 /* r0 holds lmf_addr: either the inline TLS load or the result of mono_tls_get_lmf_addr () */
409 ARM_STR_IMM (code, ARMREG_R0, ARMREG_R1, MONO_STRUCT_OFFSET (MonoLMF, lmf_addr));
410 /* new_lmf->previous_lmf = *lmf_addr */
411 ARM_LDR_IMM (code, ARMREG_IP, ARMREG_R0, MONO_STRUCT_OFFSET (MonoLMF, previous_lmf));
412 ARM_STR_IMM (code, ARMREG_IP, ARMREG_R1, MONO_STRUCT_OFFSET (MonoLMF, previous_lmf));
413 /* *(lmf_addr) = r1 */
414 ARM_STR_IMM (code, ARMREG_R1, ARMREG_R0, MONO_STRUCT_OFFSET (MonoLMF, previous_lmf));
415 /* Skip method (only needed for trampoline LMF frames) */
416 ARM_STR_IMM (code, ARMREG_SP, ARMREG_R1, MONO_STRUCT_OFFSET (MonoLMF, sp));
417 ARM_STR_IMM (code, ARMREG_FP, ARMREG_R1, MONO_STRUCT_OFFSET (MonoLMF, fp));
418 /* save the current IP */
419 ARM_MOV_REG_REG (code, ARMREG_IP, ARMREG_PC);
420 ARM_STR_IMM (code, ARMREG_IP, ARMREG_R1, MONO_STRUCT_OFFSET (MonoLMF, ip));
/* Mark every word of the MonoLMF area as holding no GC reference */
422 for (i = 0; i < sizeof (MonoLMF); i += sizeof (mgreg_t))
423 mini_gc_set_slot_type_from_fp (cfg, lmf_offset + i, SLOT_NOREF);
/*
 * emit_float_args:
 *
 *   Emit FLDS instructions loading each entry of INST->float_args from the
 * stack slot of its variable into the hardware register fad->hreg.
 * When the slot offset does not pass arm_is_fpimm8 (), the address is first
 * computed into LR with emit_big_add ().
 * The native code buffer of CFG is grown with g_realloc () when
 * *OFFSET + *MAX_LEN exceeds cfg->code_size, after which the code pointer is
 * recomputed from cfg->native_code + *OFFSET. *OFFSET is updated to the
 * current position in the buffer.
 */
434 emit_float_args (MonoCompile *cfg, MonoCallInst *inst, guint8 *code, int *max_len, guint *offset)
438 for (list = inst->float_args; list; list = list->next) {
439 FloatArgData *fad = list->data;
440 MonoInst *var = get_vreg_to_inst (cfg, fad->vreg);
441 gboolean imm = arm_is_fpimm8 (var->inst_offset);
443 /* 4+1 insns for emit_big_add () and 1 for FLDS. */
/* Make sure the buffer can hold the instructions about to be emitted */
449 if (*offset + *max_len > cfg->code_size) {
450 cfg->code_size += *max_len;
451 cfg->native_code = g_realloc (cfg->native_code, cfg->code_size);
/* The buffer may have moved, so rebase the code pointer */
453 code = cfg->native_code + *offset;
/* Offset not encodable in FLDS: go through LR */
457 code = emit_big_add (code, ARMREG_LR, var->inst_basereg, var->inst_offset);
458 ARM_FLDS (code, fad->hreg, ARMREG_LR, 0);
460 ARM_FLDS (code, fad->hreg, var->inst_basereg, var->inst_offset);
462 *offset = code - cfg->native_code;
/*
 * mono_arm_emit_vfp_scratch_save:
 *
 *   Emit an FSTD storing the VFP scratch register REG to its backup slot.
 * REG must be vfp_scratch1 or vfp_scratch2; the slot is taken from
 * cfg->arch.vfp_scratch_slots (index 0 for vfp_scratch1, 1 for vfp_scratch2).
 * When the slot offset does not pass arm_is_fpimm8 (), the address is first
 * computed into LR, which is therefore clobbered on that path.
 */
469 mono_arm_emit_vfp_scratch_save (MonoCompile *cfg, guint8 *code, int reg)
473 g_assert (reg == vfp_scratch1 || reg == vfp_scratch2);
475 inst = (MonoInst *) cfg->arch.vfp_scratch_slots [reg == vfp_scratch1 ? 0 : 1];
478 if (!arm_is_fpimm8 (inst->inst_offset)) {
479 code = emit_big_add (code, ARMREG_LR, inst->inst_basereg, inst->inst_offset);
480 ARM_FSTD (code, reg, ARMREG_LR, 0);
482 ARM_FSTD (code, reg, inst->inst_basereg, inst->inst_offset);
/*
 * mono_arm_emit_vfp_scratch_restore:
 *
 *   Emit an FLDD reloading the VFP scratch register REG from its backup slot.
 * This is the counterpart of mono_arm_emit_vfp_scratch_save (): the same slot
 * selection applies and LR is clobbered when the slot offset does not pass
 * arm_is_fpimm8 ().
 */
489 mono_arm_emit_vfp_scratch_restore (MonoCompile *cfg, guint8 *code, int reg)
493 g_assert (reg == vfp_scratch1 || reg == vfp_scratch2);
495 inst = (MonoInst *) cfg->arch.vfp_scratch_slots [reg == vfp_scratch1 ? 0 : 1];
498 if (!arm_is_fpimm8 (inst->inst_offset)) {
499 code = emit_big_add (code, ARMREG_LR, inst->inst_basereg, inst->inst_offset);
500 ARM_FLDD (code, reg, ARMREG_LR, 0);
502 ARM_FLDD (code, reg, inst->inst_basereg, inst->inst_offset);
511 * Emit code to pop an LMF structure from the LMF stack.
/*
 * emit_restore_lmf:
 *
 *   Emit code unlinking the MonoLMF at LMF_OFFSET from the frame register:
 * the saved previous_lmf is written back through the saved lmf_addr.
 * For LMF_OFFSET below 32 the frame register is used as the base directly.
 * Otherwise the MonoLMF address is computed into r2 with emit_big_add ().
 * The emitted code overwrites IP and LR, and r2 on the large offset path.
 */
514 emit_restore_lmf (MonoCompile *cfg, guint8 *code, gint32 lmf_offset)
518 if (lmf_offset < 32) {
519 basereg = cfg->frame_reg;
524 code = emit_big_add (code, ARMREG_R2, cfg->frame_reg, lmf_offset);
527 /* ip = previous_lmf */
528 ARM_LDR_IMM (code, ARMREG_IP, basereg, offset + MONO_STRUCT_OFFSET (MonoLMF, previous_lmf));
/* lr = lmf_addr */
530 ARM_LDR_IMM (code, ARMREG_LR, basereg, offset + MONO_STRUCT_OFFSET (MonoLMF, lmf_addr));
531 /* *(lmf_addr) = previous_lmf */
532 ARM_STR_IMM (code, ARMREG_IP, ARMREG_LR, MONO_STRUCT_OFFSET (MonoLMF, previous_lmf));
537 #endif /* #ifndef DISABLE_JIT */
540 * mono_arch_get_argument_info:
541 * @csig: a method signature
542 * @param_count: the number of parameters to consider
543 * @arg_info: an array to store the result infos
545 * Gathers information on parameters such as size, alignment and
546 * padding. arg_info should be large enough to hold param_count + 1 entries.
548 * Returns the size of the activation frame.
/*
 * Implementation notes: entry 0 of ARG_INFO describes the implicit leading
 * slots, entry k + 1 describes parameter k. The running frame size is padded
 * per parameter and finally rounded up to MONO_ARCH_FRAME_ALIGNMENT.
 */
551 mono_arch_get_argument_info (MonoMethodSignature *csig, int param_count, MonoJitArgumentInfo *arg_info)
553 int k, frame_size = 0;
554 guint32 size, align, pad;
558 t = mini_get_underlying_type (csig->ret);
/* A struct return value takes one pointer sized slot */
559 if (MONO_TYPE_ISSTRUCT (t)) {
560 frame_size += sizeof (gpointer);
564 arg_info [0].offset = offset;
/* NOTE(review): the condition guarding this second pointer sized slot is not visible here; presumably it accounts for the this argument - confirm */
567 frame_size += sizeof (gpointer);
571 arg_info [0].size = frame_size;
573 for (k = 0; k < param_count; k++) {
574 size = mini_type_stack_size_full (csig->params [k], &align, csig->pinvoke);
576 /* ignore alignment for now */
/* The padding inserted before parameter k is recorded on entry k, i.e. on the entry preceding the one that describes the parameter */
579 frame_size += pad = (align - (frame_size & (align - 1))) & (align - 1);
580 arg_info [k].pad = pad;
582 arg_info [k + 1].pad = 0;
583 arg_info [k + 1].size = size;
585 arg_info [k + 1].offset = offset;
/* Round the whole frame up to the architecture frame alignment; k equals param_count here */
589 align = MONO_ARCH_FRAME_ALIGNMENT;
590 frame_size += pad = (align - (frame_size & (align - 1))) & (align - 1);
591 arg_info [k].pad = pad;
596 #define MAX_ARCH_DELEGATE_PARAMS 3
/*
 * get_delegate_invoke_impl:
 *
 *   Generate a delegate invoke trampoline in memory reserved from the global
 * code manager and describe it through *INFO. Callers assign the result to
 * their code start pointer.
 * Two shapes are visible:
 * - a 12 byte one that loads delegate->method_ptr into IP, replaces r0 (the
 *   delegate) with delegate->target and jumps to IP. It is registered as
 *   "delegate_invoke_impl_has_target".
 * - one of 8 + PARAM_COUNT * 4 bytes that loads method_ptr into IP, moves
 *   each of the next PARAM_COUNT argument registers down by one and jumps to
 *   IP. It is registered as "delegate_invoke_impl_target_<PARAM_COUNT>".
 * The instruction cache is flushed for the generated range and the profiler
 * is notified about the new code buffer.
 * NOTE(review): PARAM_COUNT is declared gboolean but is used as an integer
 * count (size computation, loop bound, "%d" formatting); an int type would
 * state the intent better - confirm that gboolean is wide enough here.
 */
599 get_delegate_invoke_impl (MonoTrampInfo **info, gboolean has_target, gboolean param_count)
601 guint8 *code, *start;
602 GSList *unwind_ops = mono_arch_get_cie_program ();
/* Three 4 byte instructions */
605 start = code = mono_global_codeman_reserve (12);
607 /* Replace the this argument with the target */
608 ARM_LDR_IMM (code, ARMREG_IP, ARMREG_R0, MONO_STRUCT_OFFSET (MonoDelegate, method_ptr));
609 ARM_LDR_IMM (code, ARMREG_R0, ARMREG_R0, MONO_STRUCT_OFFSET (MonoDelegate, target));
610 ARM_MOV_REG_REG (code, ARMREG_PC, ARMREG_IP);
612 g_assert ((code - start) <= 12);
614 mono_arch_flush_icache (start, 12);
/* One load, one jump and one move per parameter */
618 size = 8 + param_count * 4;
619 start = code = mono_global_codeman_reserve (size);
621 ARM_LDR_IMM (code, ARMREG_IP, ARMREG_R0, MONO_STRUCT_OFFSET (MonoDelegate, method_ptr));
622 /* slide down the arguments */
623 for (i = 0; i < param_count; ++i) {
624 ARM_MOV_REG_REG (code, (ARMREG_R0 + i), (ARMREG_R0 + i + 1));
626 ARM_MOV_REG_REG (code, ARMREG_PC, ARMREG_IP);
628 g_assert ((code - start) <= size);
630 mono_arch_flush_icache (start, size);
634 *info = mono_tramp_info_create ("delegate_invoke_impl_has_target", start, code - start, NULL, unwind_ops);
636 char *name = g_strdup_printf ("delegate_invoke_impl_target_%d", param_count);
637 *info = mono_tramp_info_create (name, start, code - start, NULL, unwind_ops);
641 mono_profiler_code_buffer_new (start, code - start, MONO_PROFILER_CODE_BUFFER_DELEGATE_INVOKE, NULL);
647 * mono_arch_get_delegate_invoke_impls:
649 * Return a list of MonoAotTrampInfo structures for the delegate invoke impl
/*
 * Implementation notes: one trampoline is generated for the has_target case
 * and one for every parameter count from 0 to MAX_ARCH_DELEGATE_PARAMS
 * inclusive. Each resulting info is prepended to the list, so the list is in
 * reverse generation order.
 */
653 mono_arch_get_delegate_invoke_impls (void)
659 get_delegate_invoke_impl (&info, TRUE, 0);
660 res = g_slist_prepend (res, info);
662 for (i = 0; i <= MAX_ARCH_DELEGATE_PARAMS; ++i) {
663 get_delegate_invoke_impl (&info, FALSE, i);
664 res = g_slist_prepend (res, info);
/*
 * mono_arch_get_delegate_invoke_impl:
 *
 *   Look up or create the delegate invoke trampoline suitable for SIG.
 * Signatures returning a struct are special cased up front (the outcome is
 * not visible in this excerpt; presumably they are rejected).
 * With HAS_TARGET a single trampoline is cached in a function-local static.
 * Without it, one trampoline per parameter count is cached in an array of
 * MAX_ARCH_DELEGATE_PARAMS + 1 entries; signatures with more parameters, or
 * with a parameter that fails mono_is_regsize_var (), are special cased as
 * well.
 * A trampoline is obtained either from the AOT image by name
 * (mono_aot_get_trampoline ()) or generated with get_delegate_invoke_impl ()
 * and registered with mono_tramp_info_register (). The caches are accessed
 * under the mini arch lock.
 */
671 mono_arch_get_delegate_invoke_impl (MonoMethodSignature *sig, gboolean has_target)
673 guint8 *code, *start;
676 /* FIXME: Support more cases */
677 sig_ret = mini_get_underlying_type (sig->ret);
678 if (MONO_TYPE_ISSTRUCT (sig_ret))
682 static guint8* cached = NULL;
683 mono_mini_arch_lock ();
685 mono_mini_arch_unlock ();
690 start = mono_aot_get_trampoline ("delegate_invoke_impl_has_target");
693 start = get_delegate_invoke_impl (&info, TRUE, 0);
694 mono_tramp_info_register (info, NULL);
697 mono_mini_arch_unlock ();
/* One cache slot per supported parameter count */
700 static guint8* cache [MAX_ARCH_DELEGATE_PARAMS + 1] = {NULL};
703 if (sig->param_count > MAX_ARCH_DELEGATE_PARAMS)
705 for (i = 0; i < sig->param_count; ++i)
706 if (!mono_is_regsize_var (sig->params [i]))
709 mono_mini_arch_lock ();
710 code = cache [sig->param_count];
712 mono_mini_arch_unlock ();
/* The name must match the one used by get_delegate_invoke_impl () */
717 char *name = g_strdup_printf ("delegate_invoke_impl_target_%d", sig->param_count);
718 start = mono_aot_get_trampoline (name);
722 start = get_delegate_invoke_impl (&info, FALSE, sig->param_count);
723 mono_tramp_info_register (info, NULL);
725 cache [sig->param_count] = start;
726 mono_mini_arch_unlock ();
734 mono_arch_get_delegate_virtual_invoke_impl (MonoMethodSignature *sig, MonoMethod *method, int offset, gboolean load_imt_reg)
/*
 * mono_arch_get_this_arg_from_call:
 *
 *   Return the this argument of a call given the saved register array REGS.
 * The value is taken from the r0 entry; CODE is not used by the visible code.
 */
740 mono_arch_get_this_arg_from_call (mgreg_t *regs, guint8 *code)
742 return (gpointer)regs [ARMREG_R0];
746 * Initialize the cpu to execute managed code.
/*
 * mono_arch_cpu_init:
 *
 *   Record the ABI alignment of gint64 in i8_align. In cross compiling builds
 * (MONO_CROSS_COMPILE) the alignment of MONO_TYPE_I8 is also set explicitly.
 * NOTE(review): the extent of the TARGET_ANDROID conditional, and whether it
 * changes i8_align before the call, is not visible in this excerpt.
 */
749 mono_arch_cpu_init (void)
751 i8_align = MONO_ABI_ALIGNOF (gint64);
752 #ifdef MONO_CROSS_COMPILE
753 /* Need to set the alignment of i8 since it can be different on the target */
754 #ifdef TARGET_ANDROID
756 mono_type_set_alignment (MONO_TYPE_I8, i8_align);
762 * Initialize architecture specific code.
/*
 * mono_arch_init:
 *
 *   One time setup of the ARM backend state kept in this file. Visible steps:
 * - force soft breakpoints on TARGET_WATCHOS;
 * - initialize mini_arch_mutex as a recursive mutex;
 * - with soft breakpoints, fetch the breakpoint trampoline. The two trigger
 *   pages (ss_trigger_page, bp_trigger_page) are allocated read-only and
 *   bp_trigger_page is then reprotected with no access flags. Presumably
 *   that is the path taken without soft breakpoints - confirm;
 * - register the ARM specific JIT icalls with the AOT runtime;
 * - set eabi_supported when built with __ARM_EABI__;
 * - select arm_fpu from the ARM_FPU_* build defines. In ARM_FPU_NONE builds
 *   outside iOS, it falls back to MONO_ARM_FPU_NONE when no VFP unit is
 *   detected or when MONO_ARM_FORCE_SOFT_FLOAT starts with "1";
 * - initialize the v5/v6/v7 and thumb/thumb2 flags from the hwcap detection
 *   results (iOS sets thumb_supported unconditionally);
 * - let the MONO_CPU_ARCH environment variable override the detection. For a
 *   value starting with "armv", the character at index 4 is compared against
 *   the digits 5, 6 and 7; the prefixes "armv7s" and "armv7k" set the matching
 *   flags; the substrings "thumb" and "thumb2" set the thumb flags.
 */
765 mono_arch_init (void)
767 const char *cpu_arch;
769 #ifdef TARGET_WATCHOS
770 mini_get_debug_options ()->soft_breakpoints = TRUE;
773 mono_os_mutex_init_recursive (&mini_arch_mutex);
774 if (mini_get_debug_options ()->soft_breakpoints) {
776 breakpoint_tramp = mini_get_breakpoint_trampoline ();
778 ss_trigger_page = mono_valloc (NULL, mono_pagesize (), MONO_MMAP_READ|MONO_MMAP_32BIT, MONO_MEM_ACCOUNT_OTHER);
779 bp_trigger_page = mono_valloc (NULL, mono_pagesize (), MONO_MMAP_READ|MONO_MMAP_32BIT, MONO_MEM_ACCOUNT_OTHER);
780 mono_mprotect (bp_trigger_page, mono_pagesize (), 0);
783 mono_aot_register_jit_icall ("mono_arm_throw_exception", mono_arm_throw_exception);
784 mono_aot_register_jit_icall ("mono_arm_throw_exception_by_token", mono_arm_throw_exception_by_token);
785 mono_aot_register_jit_icall ("mono_arm_resume_unwind", mono_arm_resume_unwind);
786 #if defined(MONO_ARCH_GSHAREDVT_SUPPORTED)
787 mono_aot_register_jit_icall ("mono_arm_start_gsharedvt_call", mono_arm_start_gsharedvt_call);
789 mono_aot_register_jit_icall ("mono_arm_unaligned_stack", mono_arm_unaligned_stack);
790 mono_aot_register_jit_icall ("mono_arm_handler_block_trampoline_helper", mono_arm_handler_block_trampoline_helper);
791 #if defined(__ARM_EABI__)
792 eabi_supported = TRUE;
795 #if defined(ARM_FPU_VFP_HARD)
796 arm_fpu = MONO_ARM_FPU_VFP_HARD;
798 arm_fpu = MONO_ARM_FPU_VFP;
800 #if defined(ARM_FPU_NONE) && !defined(TARGET_IOS)
802 * If we're compiling with a soft float fallback and it
803 * turns out that no VFP unit is available, we need to
804 * switch to soft float. We don't do this for iOS, since
805 * iOS devices always have a VFP unit.
807 if (!mono_hwcap_arm_has_vfp)
808 arm_fpu = MONO_ARM_FPU_NONE;
811 * This environment variable can be useful in testing
812 * environments to make sure the soft float fallback
813 * works. Most ARM devices have VFP units these days, so
814 * normally soft float code would not be exercised much.
816 const char *soft = g_getenv ("MONO_ARM_FORCE_SOFT_FLOAT");
818 if (soft && !strncmp (soft, "1", 1))
819 arm_fpu = MONO_ARM_FPU_NONE;
824 v5_supported = mono_hwcap_arm_is_v5;
825 v6_supported = mono_hwcap_arm_is_v6;
826 v7_supported = mono_hwcap_arm_is_v7;
829 * On weird devices, the hwcap code may fail to detect
830 * the ARM version. In that case, we can at least safely
831 * assume the version the runtime was compiled for.
843 #if defined(TARGET_IOS)
844 /* iOS is special-cased here because we don't yet
845 have a way to properly detect CPU features on it. */
846 thumb_supported = TRUE;
849 thumb_supported = mono_hwcap_arm_has_thumb;
850 thumb2_supported = mono_hwcap_arm_has_thumb2;
853 /* Format: armv(5|6|7[s])[-thumb[2]] */
854 cpu_arch = g_getenv ("MONO_CPU_ARCH");
856 /* Do this here so it overrides any detection. */
858 if (strncmp (cpu_arch, "armv", 4) == 0) {
859 v5_supported = cpu_arch [4] >= '5';
860 v6_supported = cpu_arch [4] >= '6';
861 v7_supported = cpu_arch [4] >= '7';
862 v7s_supported = strncmp (cpu_arch, "armv7s", 6) == 0;
863 v7k_supported = strncmp (cpu_arch, "armv7k", 6) == 0;
866 thumb_supported = strstr (cpu_arch, "thumb") != NULL;
867 thumb2_supported = strstr (cpu_arch, "thumb2") != NULL;
873 * Cleanup architecture specific code.
876 mono_arch_cleanup (void)
881 * This function returns the optimizations supported on this cpu.
884 mono_arch_cpu_optimizations (guint32 *exclude_mask)
886 /* no arm-specific optimizations yet */
892 * This function tests for all SIMD functions supported.
894 * Returns a bitmask corresponding to all supported versions.
898 mono_arch_cpu_enumerate_simd_versions (void)
900 /* SIMD is currently unimplemented */
/*
 * mono_arm_is_hard_float:
 *
 *   Return whether the FPU mode selected at init time (arm_fpu) is
 * MONO_ARM_FPU_VFP_HARD.
 */
905 mono_arm_is_hard_float (void)
907 return arm_fpu == MONO_ARM_FPU_VFP_HARD;
913 mono_arch_opcode_needs_emulation (MonoCompile *cfg, int opcode)
915 if (v7s_supported || v7k_supported) {
929 #ifdef MONO_ARCH_SOFT_FLOAT_FALLBACK
/*
 * mono_arch_is_soft_float:
 *
 *   Return whether the FPU mode selected at init time (arm_fpu) is
 * MONO_ARM_FPU_NONE. Only compiled with MONO_ARCH_SOFT_FLOAT_FALLBACK.
 */
931 mono_arch_is_soft_float (void)
933 return arm_fpu == MONO_ARM_FPU_NONE;
938 is_regsize_var (MonoType *t)
942 t = mini_get_underlying_type (t);
949 case MONO_TYPE_FNPTR:
951 case MONO_TYPE_OBJECT:
953 case MONO_TYPE_GENERICINST:
954 if (!mono_type_generic_inst_is_valuetype (t))
957 case MONO_TYPE_VALUETYPE:
/*
 * mono_arch_get_allocatable_int_vars:
 *
 *   Walk all variables of CFG and collect those that may live in an integer
 * register into a list kept sorted by mono_varlist_insert_sorted ().
 * The visible filters test for: a live range whose first use is not before
 * its last use; the MONO_INST_VOLATILE or MONO_INST_INDIRECT flags; and an
 * opcode other than OP_LOCAL or OP_ARG. Presumably matching variables are
 * skipped (the statements following the tests are not visible in this
 * excerpt). Only variables whose type passes is_regsize_var () are added.
 */
964 mono_arch_get_allocatable_int_vars (MonoCompile *cfg)
969 for (i = 0; i < cfg->num_varinfo; i++) {
970 MonoInst *ins = cfg->varinfo [i];
971 MonoMethodVar *vmv = MONO_VARINFO (cfg, i);
974 if (vmv->range.first_use.abs_pos >= vmv->range.last_use.abs_pos)
977 if (ins->flags & (MONO_INST_VOLATILE|MONO_INST_INDIRECT) || (ins->opcode != OP_LOCAL && ins->opcode != OP_ARG))
980 /* we can only allocate 32 bit values */
981 if (is_regsize_var (ins->inst_vtype)) {
/* The variable must not have a register yet and must sit at its own index */
982 g_assert (MONO_VARINFO (cfg, i)->reg == -1);
983 g_assert (i == vmv->idx);
984 vars = mono_varlist_insert_sorted (cfg, vars, vmv, FALSE);
/*
 * mono_arch_get_global_int_regs:
 *
 *   Build the list of integer registers offered to the global register
 * allocator for CFG. mono_arch_compute_omit_fp () is run first. Methods that
 * contain calls are marked as using the rgctx register. FP is offered when
 * the frame pointer is omitted. V1, V2 and V3 are offered. V7 or V4 is
 * offered depending on a condition that is not visible in this excerpt; the
 * existing comment ties it to V4 being used as a frame pointer. V5 is offered
 * only when the method is not AOT compiled, does not use the rgctx register
 * and is not compiled with LLVM.
 * The list is built with g_list_prepend (), so registers appear in reverse
 * order of insertion.
 */
992 mono_arch_get_global_int_regs (MonoCompile *cfg)
996 mono_arch_compute_omit_fp (cfg);
999 * FIXME: Interface calls might go through a static rgctx trampoline which
1000 * sets V5, but it doesn't save it, so we need to save it ourselves, and
1003 if (cfg->flags & MONO_CFG_HAS_CALLS)
1004 cfg->uses_rgctx_reg = TRUE;
1006 if (cfg->arch.omit_fp)
1007 regs = g_list_prepend (regs, GUINT_TO_POINTER (ARMREG_FP));
1008 regs = g_list_prepend (regs, GUINT_TO_POINTER (ARMREG_V1));
1009 regs = g_list_prepend (regs, GUINT_TO_POINTER (ARMREG_V2));
1010 regs = g_list_prepend (regs, GUINT_TO_POINTER (ARMREG_V3));
1012 /* V4=R7 is used as a frame pointer, but V7=R10 is preserved */
1013 regs = g_list_prepend (regs, GUINT_TO_POINTER (ARMREG_V7));
1015 regs = g_list_prepend (regs, GUINT_TO_POINTER (ARMREG_V4));
1016 if (!(cfg->compile_aot || cfg->uses_rgctx_reg || COMPILE_LLVM (cfg)))
1017 /* V5 is reserved for passing the vtable/rgctx/IMT method */
1018 regs = g_list_prepend (regs, GUINT_TO_POINTER (ARMREG_V5));
1019 /*regs = g_list_prepend (regs, GUINT_TO_POINTER (ARMREG_V6));*/
1020 /*regs = g_list_prepend (regs, GUINT_TO_POINTER (ARMREG_V7));*/
1026 * mono_arch_regalloc_cost:
1028 * Return the cost, in number of memory references, of the action of
1029 * allocating the variable VMV into a register during global register
1033 mono_arch_regalloc_cost (MonoCompile *cfg, MonoMethodVar *vmv)
1039 #endif /* #ifndef DISABLE_JIT */
/*
 * mono_arch_flush_icache:
 *
 *   Make SIZE bytes of freshly written code at CODE visible to instruction
 * fetch. Two mechanisms are visible: sys_icache_invalidate () and the
 * compiler builtin __builtin___clear_cache () over [code, code + size).
 * MONO_CROSS_COMPILE builds take a separate branch whose body is not visible
 * in this excerpt (presumably empty); the condition selecting between the two
 * mechanisms is not visible either.
 */
1042 mono_arch_flush_icache (guint8 *code, gint size)
1044 #if defined(MONO_CROSS_COMPILE)
1046 sys_icache_invalidate (code, size);
1048 __builtin___clear_cache (code, code + size);
/*
 * add_general:
 *
 *   Assign the location of one integer argument and record it in AINFO, using
 * *GR as the next free core register and *STACK_SIZE as the next free stack
 * offset.
 * Visible outcomes for what is presumably the SIMPLE (single word) case:
 * - *GR beyond r3: on the stack (RegTypeBase, base register SP as seen from
 *   the caller, offset *STACK_SIZE);
 * - otherwise: in a core register (RegTypeGeneral).
 * Visible outcomes for what is presumably the two word case:
 * - *GR is r3 and 64 bit values are only 4 byte aligned (i8_align == 4):
 *   split between r3 and the stack (RegTypeBaseGen);
 * - *GR at or beyond r3 otherwise: on the stack (RegTypeBase). An adjustment
 *   under eabi_supported with i8_align == 8 is not visible in this excerpt;
 * - registers available: a register pair (RegTypeIRegPair). Under
 *   eabi_supported with i8_align == 8 an odd *GR is special cased, presumably
 *   to start the pair on an even register - confirm.
 * NOTE(review): the updates of *GR and *STACK_SIZE are not visible in this
 * excerpt.
 */
1055 add_general (guint *gr, guint *stack_size, ArgInfo *ainfo, gboolean simple)
1058 if (*gr > ARMREG_R3) {
1060 ainfo->offset = *stack_size;
1061 ainfo->reg = ARMREG_SP; /* in the caller */
1062 ainfo->storage = RegTypeBase;
1065 ainfo->storage = RegTypeGeneral;
/* Splitting a value between r3 and the stack is only allowed with 4 byte aligned 64 bit values */
1072 split = i8_align == 4;
1077 if (*gr == ARMREG_R3 && split) {
1078 /* first word in r3 and the second on the stack */
1079 ainfo->offset = *stack_size;
1080 ainfo->reg = ARMREG_SP; /* in the caller */
1081 ainfo->storage = RegTypeBaseGen;
1083 } else if (*gr >= ARMREG_R3) {
1084 if (eabi_supported) {
1085 /* darwin aligns longs to 4 byte only */
1086 if (i8_align == 8) {
1091 ainfo->offset = *stack_size;
1092 ainfo->reg = ARMREG_SP; /* in the caller */
1093 ainfo->storage = RegTypeBase;
1096 if (eabi_supported) {
1097 if (i8_align == 8 && ((*gr) & 1))
1100 ainfo->storage = RegTypeIRegPair;
/*
 * add_float:
 *
 *   Assign the location of one floating point argument and record it in
 * AINFO. *FPR is the next free single precision register, *STACK_SIZE the
 * next free stack offset and *FLOAT_SPARE either a skipped single precision
 * register available for back-filling or a negative value.
 * The argument goes to a register (RegTypeFP) while *FPR is below ARM_VFP_F16,
 * or when it is single precision and a spare register exists. Otherwise it is
 * placed on the stack (RegTypeBase, base register SP, offset *STACK_SIZE).
 * The register selection rules are described by the comments in the body.
 */
1109 add_float (guint *fpr, guint *stack_size, ArgInfo *ainfo, gboolean is_double, gint *float_spare)
1112 * If we're calling a function like this:
1114 * void foo(float a, double b, float c)
1116 * We pass a in s0 and b in d1. That leaves us
1117 * with s1 being unused. The armhf ABI recognizes
1118 * this and requires register assignment to then
1119 * use that for the next single-precision arg,
1120 * i.e. c in this example. So float_spare either
1121 * tells us which reg to use for the next single-
1122 * precision arg, or it's -1, meaning use *fpr.
1124 * Note that even though most of the JIT speaks
1125 * double-precision, fpr represents single-
1126 * precision registers.
1128 * See parts 5.5 and 6.1.2 of the AAPCS for how
1132 if (*fpr < ARM_VFP_F16 || (!is_double && *float_spare >= 0)) {
1133 ainfo->storage = RegTypeFP;
1137 * If we're passing a double-precision value
1138 * and *fpr is odd (e.g. it's s1, s3, ...)
1139 * we need to use the next even register. So
1140 * we mark the current *fpr as a spare that
1141 * can be used for the next single-precision
1145 *float_spare = *fpr;
1150 * At this point, we have an even register
1151 * so we assign that and move along.
1155 } else if (*float_spare >= 0) {
1157 * We're passing a single-precision value
1158 * and it looks like a spare single-
1159 * precision register is available. Let's
1163 ainfo->reg = *float_spare;
1167 * If we hit this branch, we're passing a
1168 * single-precision value and we can simply
1169 * use the next available register.
1177 * We've exhausted available floating point
1178 * regs, so pass the rest on the stack.
1186 ainfo->offset = *stack_size;
1187 ainfo->reg = ARMREG_SP;
1188 ainfo->storage = RegTypeBase;
/*
 * is_hfa:
 *
 *   Check whether the value type T is a homogeneous floating point aggregate:
 * every instance field, after flattening nested structs through recursion, is
 * a non-byref R4 or every one is a non-byref R8, and there are between 1 and
 * 4 such fields in total.
 * On success *OUT_NFIELDS receives the flattened field count and *OUT_ESIZE
 * the element size (4 for R4, 8 otherwise).
 * NOTE(review): the return statements are not visible in this excerpt;
 * presumably each failed check returns FALSE and the end returns TRUE.
 */
1195 is_hfa (MonoType *t, int *out_nfields, int *out_esize)
1199 MonoClassField *field;
1200 MonoType *ftype, *prev_ftype = NULL;
1203 klass = mono_class_from_mono_type (t);
1205 while ((field = mono_class_get_fields (klass, &iter))) {
/* Static fields are tested for here; presumably they are skipped */
1206 if (field->type->attrs & FIELD_ATTRIBUTE_STATIC)
1208 ftype = mono_field_get_type (field);
1209 ftype = mini_get_underlying_type (ftype);
1211 if (MONO_TYPE_ISSTRUCT (ftype)) {
1212 int nested_nfields, nested_esize;
/* A nested struct must itself be an HFA; it is then treated as a run of its element type */
1214 if (!is_hfa (ftype, &nested_nfields, &nested_esize))
1216 if (nested_esize == 4)
1217 ftype = &mono_defaults.single_class->byval_arg;
1219 ftype = &mono_defaults.double_class->byval_arg;
1220 if (prev_ftype && prev_ftype->type != ftype->type)
1223 nfields += nested_nfields;
/* Plain field: must be a by-value float or double of the same kind as the previous fields */
1225 if (!(!ftype->byref && (ftype->type == MONO_TYPE_R4 || ftype->type == MONO_TYPE_R8)))
1227 if (prev_ftype && prev_ftype->type != ftype->type)
1233 if (nfields == 0 || nfields > 4)
1235 *out_nfields = nfields;
1236 *out_esize = prev_ftype->type == MONO_TYPE_R4 ? 4 : 8;
1241 get_call_info (MonoMemPool *mp, MonoMethodSignature *sig)
1243 guint i, gr, fpr, pstart;
1245 int n = sig->hasthis + sig->param_count;
1249 guint32 stack_size = 0;
1251 gboolean is_pinvoke = sig->pinvoke;
1252 gboolean vtype_retaddr = FALSE;
1255 cinfo = mono_mempool_alloc0 (mp, sizeof (CallInfo) + (sizeof (ArgInfo) * n));
1257 cinfo = g_malloc0 (sizeof (CallInfo) + (sizeof (ArgInfo) * n));
1264 t = mini_get_underlying_type (sig->ret);
1275 case MONO_TYPE_FNPTR:
1276 case MONO_TYPE_OBJECT:
1277 cinfo->ret.storage = RegTypeGeneral;
1278 cinfo->ret.reg = ARMREG_R0;
1282 cinfo->ret.storage = RegTypeIRegPair;
1283 cinfo->ret.reg = ARMREG_R0;
1287 cinfo->ret.storage = RegTypeFP;
1289 if (t->type == MONO_TYPE_R4)
1290 cinfo->ret.size = 4;
1292 cinfo->ret.size = 8;
1294 if (IS_HARD_FLOAT) {
1295 cinfo->ret.reg = ARM_VFP_F0;
1297 cinfo->ret.reg = ARMREG_R0;
1300 case MONO_TYPE_GENERICINST:
1301 if (!mono_type_generic_inst_is_valuetype (t)) {
1302 cinfo->ret.storage = RegTypeGeneral;
1303 cinfo->ret.reg = ARMREG_R0;
1306 if (mini_is_gsharedvt_variable_type (t)) {
1307 cinfo->ret.storage = RegTypeStructByAddr;
1311 case MONO_TYPE_VALUETYPE:
1312 case MONO_TYPE_TYPEDBYREF:
1313 if (IS_HARD_FLOAT && sig->pinvoke && is_hfa (t, &nfields, &esize)) {
1314 cinfo->ret.storage = RegTypeHFA;
1316 cinfo->ret.nregs = nfields;
1317 cinfo->ret.esize = esize;
1320 int native_size = mono_class_native_size (mono_class_from_mono_type (t), &align);
1323 #ifdef TARGET_WATCHOS
1328 if (native_size <= max_size) {
1329 cinfo->ret.storage = RegTypeStructByVal;
1330 cinfo->ret.struct_size = native_size;
1331 cinfo->ret.nregs = ALIGN_TO (native_size, 4) / 4;
1333 cinfo->ret.storage = RegTypeStructByAddr;
1336 cinfo->ret.storage = RegTypeStructByAddr;
1341 case MONO_TYPE_MVAR:
1342 g_assert (mini_is_gsharedvt_type (t));
1343 cinfo->ret.storage = RegTypeStructByAddr;
1345 case MONO_TYPE_VOID:
1348 g_error ("Can't handle as return value 0x%x", sig->ret->type);
1351 vtype_retaddr = cinfo->ret.storage == RegTypeStructByAddr;
1356 * To simplify get_this_arg_reg () and LLVM integration, emit the vret arg after
1357 * the first argument, allowing 'this' to be always passed in the first arg reg.
1358 * Also do this if the first argument is a reference type, since virtual calls
1359 * are sometimes made using calli without sig->hasthis set, like in the delegate
1362 if (vtype_retaddr && !is_pinvoke && (sig->hasthis || (sig->param_count > 0 && MONO_TYPE_IS_REFERENCE (mini_get_underlying_type (sig->params [0]))))) {
1364 add_general (&gr, &stack_size, cinfo->args + 0, TRUE);
1366 add_general (&gr, &stack_size, &cinfo->args [sig->hasthis + 0], TRUE);
1370 cinfo->ret.reg = gr;
1372 cinfo->vret_arg_index = 1;
1376 add_general (&gr, &stack_size, cinfo->args + 0, TRUE);
1379 if (vtype_retaddr) {
1380 cinfo->ret.reg = gr;
1385 DEBUG(g_print("params: %d\n", sig->param_count));
1386 for (i = pstart; i < sig->param_count; ++i) {
1387 ArgInfo *ainfo = &cinfo->args [n];
1389 if ((sig->call_convention == MONO_CALL_VARARG) && (i == sig->sentinelpos)) {
1390 /* Prevent implicit arguments and sig_cookie from
1391 being passed in registers */
1394 /* Emit the signature cookie just before the implicit arguments */
1395 add_general (&gr, &stack_size, &cinfo->sig_cookie, TRUE);
1397 DEBUG(g_print("param %d: ", i));
1398 if (sig->params [i]->byref) {
1399 DEBUG(g_print("byref\n"));
1400 add_general (&gr, &stack_size, ainfo, TRUE);
1404 t = mini_get_underlying_type (sig->params [i]);
1408 cinfo->args [n].size = 1;
1409 add_general (&gr, &stack_size, ainfo, TRUE);
1413 cinfo->args [n].size = 2;
1414 add_general (&gr, &stack_size, ainfo, TRUE);
1418 cinfo->args [n].size = 4;
1419 add_general (&gr, &stack_size, ainfo, TRUE);
1424 case MONO_TYPE_FNPTR:
1425 case MONO_TYPE_OBJECT:
1426 cinfo->args [n].size = sizeof (gpointer);
1427 add_general (&gr, &stack_size, ainfo, TRUE);
1429 case MONO_TYPE_GENERICINST:
1430 if (!mono_type_generic_inst_is_valuetype (t)) {
1431 cinfo->args [n].size = sizeof (gpointer);
1432 add_general (&gr, &stack_size, ainfo, TRUE);
1435 if (mini_is_gsharedvt_variable_type (t)) {
1436 /* gsharedvt arguments are passed by ref */
1437 g_assert (mini_is_gsharedvt_type (t));
1438 add_general (&gr, &stack_size, ainfo, TRUE);
1439 switch (ainfo->storage) {
1440 case RegTypeGeneral:
1441 ainfo->storage = RegTypeGSharedVtInReg;
1444 ainfo->storage = RegTypeGSharedVtOnStack;
1447 g_assert_not_reached ();
1452 case MONO_TYPE_TYPEDBYREF:
1453 case MONO_TYPE_VALUETYPE: {
1456 int nwords, nfields, esize;
1459 if (IS_HARD_FLOAT && sig->pinvoke && is_hfa (t, &nfields, &esize)) {
1460 if (fpr + nfields < ARM_VFP_F16) {
1461 ainfo->storage = RegTypeHFA;
1463 ainfo->nregs = nfields;
1464 ainfo->esize = esize;
1475 if (t->type == MONO_TYPE_TYPEDBYREF) {
1476 size = sizeof (MonoTypedRef);
1477 align = sizeof (gpointer);
1479 MonoClass *klass = mono_class_from_mono_type (sig->params [i]);
1481 size = mono_class_native_size (klass, &align);
1483 size = mini_type_stack_size_full (t, &align, FALSE);
1485 DEBUG(g_print ("load %d bytes struct\n", size));
1487 #ifdef TARGET_WATCHOS
1488 /* watchOS passes large structures by reference */
1489 /* We only do this for pinvoke to make gsharedvt/dyncall simpler */
1490 if (sig->pinvoke && size > 16) {
1491 add_general (&gr, &stack_size, ainfo, TRUE);
1492 switch (ainfo->storage) {
1493 case RegTypeGeneral:
1494 ainfo->storage = RegTypeStructByAddr;
1497 ainfo->storage = RegTypeStructByAddrOnStack;
1500 g_assert_not_reached ();
1509 align_size += (sizeof (gpointer) - 1);
1510 align_size &= ~(sizeof (gpointer) - 1);
1511 nwords = (align_size + sizeof (gpointer) -1 ) / sizeof (gpointer);
1512 ainfo->storage = RegTypeStructByVal;
1513 ainfo->struct_size = size;
1514 ainfo->align = align;
1515 /* FIXME: align stack_size if needed */
1516 if (eabi_supported) {
1517 if (align >= 8 && (gr & 1))
1520 if (gr > ARMREG_R3) {
1522 ainfo->vtsize = nwords;
1524 int rest = ARMREG_R3 - gr + 1;
1525 int n_in_regs = rest >= nwords? nwords: rest;
1527 ainfo->size = n_in_regs;
1528 ainfo->vtsize = nwords - n_in_regs;
1531 nwords -= n_in_regs;
1533 if (sig->call_convention == MONO_CALL_VARARG)
1534 /* This matches the alignment in mono_ArgIterator_IntGetNextArg () */
1535 stack_size = ALIGN_TO (stack_size, align);
1536 ainfo->offset = stack_size;
1537 /*g_print ("offset for arg %d at %d\n", n, stack_size);*/
1538 stack_size += nwords * sizeof (gpointer);
1544 add_general (&gr, &stack_size, ainfo, FALSE);
1550 add_float (&fpr, &stack_size, ainfo, FALSE, &float_spare);
1552 add_general (&gr, &stack_size, ainfo, TRUE);
1558 add_float (&fpr, &stack_size, ainfo, TRUE, &float_spare);
1560 add_general (&gr, &stack_size, ainfo, FALSE);
1563 case MONO_TYPE_MVAR:
1564 /* gsharedvt arguments are passed by ref */
1565 g_assert (mini_is_gsharedvt_type (t));
1566 add_general (&gr, &stack_size, ainfo, TRUE);
1567 switch (ainfo->storage) {
1568 case RegTypeGeneral:
1569 ainfo->storage = RegTypeGSharedVtInReg;
1572 ainfo->storage = RegTypeGSharedVtOnStack;
1575 g_assert_not_reached ();
1579 g_error ("Can't handle 0x%x", sig->params [i]->type);
1584 /* Handle the case where there are no implicit arguments */
1585 if ((sig->call_convention == MONO_CALL_VARARG) && (i == sig->sentinelpos)) {
1586 /* Prevent implicit arguments and sig_cookie from
1587 being passed in registers */
1590 /* Emit the signature cookie just before the implicit arguments */
1591 add_general (&gr, &stack_size, &cinfo->sig_cookie, TRUE);
1594 /* align stack size to 8 */
1595 DEBUG (g_print (" stack size: %d (%d)\n", (stack_size + 15) & ~15, stack_size));
1596 stack_size = (stack_size + 7) & ~7;
1598 cinfo->stack_usage = stack_size;
/*
 * mono_arch_tail_call_supported:
 *
 *   Compare the calling conventions of CALLER_SIG and CALLEE_SIG to decide
 * whether a tail call between them can be supported. Call info is computed
 * for both signatures (get_call_info () is passed NULL as its first argument)
 * and the decision is based on the stack usage of the two and on how the
 * callee returns its value.
 */
1604 mono_arch_tail_call_supported (MonoCompile *cfg, MonoMethodSignature *caller_sig, MonoMethodSignature *callee_sig)
1606 MonoType *callee_ret;
1610 c1 = get_call_info (NULL, caller_sig);
1611 c2 = get_call_info (NULL, callee_sig);
1614 * Tail calls with more callee stack usage than the caller cannot be supported, since
1615 * the extra stack space would be left on the stack after the tail call.
/* Starting answer: the caller must use at least as much stack as the callee. */
1617 res = c1->stack_usage >= c2->stack_usage;
1618 callee_ret = mini_get_underlying_type (callee_sig->ret);
/* Struct returns whose storage is not RegTypeStructByVal are tested separately. */
1619 if (callee_ret && MONO_TYPE_ISSTRUCT (callee_ret) && c2->ret.storage != RegTypeStructByVal)
1620 /* An address on the callee's stack is passed as the first argument */
/* A callee stack usage above 16 * 4 = 64 is tested separately as well. */
1623 if (c2->stack_usage > 16 * 4)
/*
 * debug_omit_fp:
 *
 *   Debugging switch consulted by mono_arch_compute_omit_fp (): a zero result
 * makes that function keep the frame pointer. The visible return statement
 * forwards the result of mono_debug_count ().
 * NOTE(review): any preprocessor guard around this return is not visible
 * here - confirm which path is actually compiled.
 */
1635 debug_omit_fp (void)
1638 return mono_debug_count ();
1645 * mono_arch_compute_omit_fp:
1646 * Determine whether the frame pointer can be eliminated.
/*
 * Decides whether the method being compiled can do without a frame pointer
 * and stores the answer in cfg->arch.omit_fp. cfg->arch.omit_fp_computed is
 * checked on entry and set once the decision has been started, so the
 * computation is tied to that flag. The call info for the method signature is
 * created from cfg->mempool and cached in cfg->arch.cinfo when it is not
 * there yet.
 *
 * omit_fp starts out TRUE and is cleared when any of the following holds:
 * cfg->disable_omit_fp, debug_omit_fp () returning zero, the method saving an
 * LMF, MONO_CFG_HAS_ALLOCA, exception clauses in the header, a non-zero
 * param area, a non-pinvoke vararg signature, call tracing being active for
 * the method, or an argument stored as RegTypeBase, RegTypeBaseGen or
 * RegTypeStructByVal.
 */
1649 mono_arch_compute_omit_fp (MonoCompile *cfg)
1651 MonoMethodSignature *sig;
1652 MonoMethodHeader *header;
1656 if (cfg->arch.omit_fp_computed)
1659 header = cfg->header;
1661 sig = mono_method_signature (cfg->method);
/* Build the call info lazily and keep it on cfg for later users. */
1663 if (!cfg->arch.cinfo)
1664 cfg->arch.cinfo = get_call_info (cfg->mempool, sig);
1665 cinfo = cfg->arch.cinfo;
1668 * FIXME: Remove some of the restrictions.
/* Start optimistic; the checks below can only switch omit_fp off. */
1670 cfg->arch.omit_fp = TRUE;
1671 cfg->arch.omit_fp_computed = TRUE;
1673 if (cfg->disable_omit_fp)
1674 cfg->arch.omit_fp = FALSE;
1675 if (!debug_omit_fp ())
1676 cfg->arch.omit_fp = FALSE;
1678 if (cfg->method->save_lmf)
1679 cfg->arch.omit_fp = FALSE;
1681 if (cfg->flags & MONO_CFG_HAS_ALLOCA)
1682 cfg->arch.omit_fp = FALSE;
1683 if (header->num_clauses)
1684 cfg->arch.omit_fp = FALSE;
1685 if (cfg->param_area)
1686 cfg->arch.omit_fp = FALSE;
1687 if (!sig->pinvoke && (sig->call_convention == MONO_CALL_VARARG))
1688 cfg->arch.omit_fp = FALSE;
1689 if ((mono_jit_trace_calls != NULL && mono_trace_eval (cfg->method)))
1690 cfg->arch.omit_fp = FALSE;
/* Inspect every argument slot, the implicit this included. */
1691 for (i = 0; i < sig->param_count + sig->hasthis; ++i) {
1692 ArgInfo *ainfo = &cinfo->args [i];
1694 if (ainfo->storage == RegTypeBase || ainfo->storage == RegTypeBaseGen || ainfo->storage == RegTypeStructByVal) {
1696 * The stack offset can only be determined when the frame
1699 cfg->arch.omit_fp = FALSE;
/* Add up mono_type_size () of the variables from cfg->locals_start onwards. */
1704 for (i = cfg->locals_start; i < cfg->num_varinfo; i++) {
1705 MonoInst *ins = cfg->varinfo [i];
1708 locals_size += mono_type_size (ins->inst_vtype, &ialign);
1713 * Set var information according to the calling convention. arm version.
1714 * The locals var stuff should most likely be split in another method.
/*
 * Lays out the stack frame of the method being compiled. A running 'offset'
 * is advanced through the frame and each variable that needs memory is turned
 * into an OP_REGOFFSET relative to cfg->frame_reg. In the order of the code
 * below:
 *  - the frame register is chosen from the result of
 *    mono_arch_compute_omit_fp () and a few registers are marked as used;
 *  - the return value is bound to r0, to a local slot, or to the vret_addr
 *    slot, depending on cinfo->ret.storage;
 *  - the debugger helper variables (seq_point_info_var, ss_trigger_page_var,
 *    seq_point_ss_method_var, seq_point_bp_method_var) and the temporary for
 *    the atomic ops get their slots;
 *  - the locals are placed between cfg->locals_min_stack_offset and
 *    cfg->locals_max_stack_offset;
 *  - the sig cookie slot (vararg methods) and the arguments follow.
 * The final offset is stored in cfg->stack_offset.
 */
1717 mono_arch_allocate_vars (MonoCompile *cfg)
1719 MonoMethodSignature *sig;
1720 MonoMethodHeader *header;
1723 int i, offset, size, align, curinst;
1728 sig = mono_method_signature (cfg->method);
1730 if (!cfg->arch.cinfo)
1731 cfg->arch.cinfo = get_call_info (cfg->mempool, sig);
1732 cinfo = cfg->arch.cinfo;
1733 sig_ret = mini_get_underlying_type (sig->ret);
1735 mono_arch_compute_omit_fp (cfg);
/* Register the frame is addressed from: SP when the frame pointer is omitted, FP if not. */
1737 if (cfg->arch.omit_fp)
1738 cfg->frame_reg = ARMREG_SP;
1740 cfg->frame_reg = ARMREG_FP;
1742 cfg->flags |= MONO_CFG_HAS_SPILLUP;
1744 /* allow room for the vararg method args: void* and long/double */
1745 if (mono_jit_trace_calls != NULL && mono_trace_eval (cfg->method))
1746 cfg->param_area = MAX (cfg->param_area, sizeof (gpointer)*8);
1748 header = cfg->header;
1750 /* See mono_arch_get_global_int_regs () */
1751 if (cfg->flags & MONO_CFG_HAS_CALLS)
1752 cfg->uses_rgctx_reg = TRUE;
/* A frame register other than SP is taken out of the allocatable set. */
1754 if (cfg->frame_reg != ARMREG_SP)
1755 cfg->used_int_regs |= 1 << cfg->frame_reg;
1757 if (cfg->compile_aot || cfg->uses_rgctx_reg || COMPILE_LLVM (cfg))
1758 /* V5 is reserved for passing the vtable/rgctx/IMT method */
1759 cfg->used_int_regs |= (1 << MONO_ARCH_IMT_REG);
/* Non-struct, non-void results that are not returned by address live in r0. */
1763 if (!MONO_TYPE_ISSTRUCT (sig_ret) && cinfo->ret.storage != RegTypeStructByAddr) {
1764 if (sig_ret->type != MONO_TYPE_VOID) {
1765 cfg->ret->opcode = OP_REGVAR;
1766 cfg->ret->inst_c0 = ARMREG_R0;
1769 /* local vars are at a positive offset from the stack pointer */
1771 * also note that if the function uses alloca, we use FP
1772 * to point at the local variables.
1774 offset = 0; /* linkage area */
1775 /* align the offset to 16 bytes: not sure this is needed here */
1777 //offset &= ~(8 - 1);
1779 /* add parameter area size for called functions */
1780 offset += cfg->param_area;
1783 if (cfg->flags & MONO_CFG_HAS_FPOUT)
1786 /* allow room to save the return value */
1787 if (mono_jit_trace_calls != NULL && mono_trace_eval (cfg->method))
/* Reserve frame space according to how the return value is stored. */
1790 switch (cinfo->ret.storage) {
1791 case RegTypeStructByVal:
1793 /* Allocate a local to hold the result, the epilog will copy it to the correct place */
1794 offset = ALIGN_TO (offset, 8);
1795 cfg->ret->opcode = OP_REGOFFSET;
1796 cfg->ret->inst_basereg = cfg->frame_reg;
1797 cfg->ret->inst_offset = offset;
1798 if (cinfo->ret.storage == RegTypeStructByVal)
1799 offset += cinfo->ret.nregs * sizeof (gpointer);
1803 case RegTypeStructByAddr:
/* The hidden return-address argument gets a pointer-sized, pointer-aligned slot. */
1804 ins = cfg->vret_addr;
1805 offset += sizeof(gpointer) - 1;
1806 offset &= ~(sizeof(gpointer) - 1);
1807 ins->inst_offset = offset;
1808 ins->opcode = OP_REGOFFSET;
1809 ins->inst_basereg = cfg->frame_reg;
1810 if (G_UNLIKELY (cfg->verbose_level > 1)) {
1811 g_print ("vret_addr =");
1812 mono_print_ins (cfg->vret_addr);
1814 offset += sizeof(gpointer);
1820 /* Allocate these first so they have a small offset, OP_SEQ_POINT depends on this */
1821 if (cfg->arch.seq_point_info_var) {
1824 ins = cfg->arch.seq_point_info_var;
1828 offset += align - 1;
1829 offset &= ~(align - 1);
1830 ins->opcode = OP_REGOFFSET;
1831 ins->inst_basereg = cfg->frame_reg;
1832 ins->inst_offset = offset;
1835 if (cfg->arch.ss_trigger_page_var) {
1838 ins = cfg->arch.ss_trigger_page_var;
1841 offset += align - 1;
1842 offset &= ~(align - 1);
1843 ins->opcode = OP_REGOFFSET;
1844 ins->inst_basereg = cfg->frame_reg;
1845 ins->inst_offset = offset;
1849 if (cfg->arch.seq_point_ss_method_var) {
1852 ins = cfg->arch.seq_point_ss_method_var;
1855 offset += align - 1;
1856 offset &= ~(align - 1);
1857 ins->opcode = OP_REGOFFSET;
1858 ins->inst_basereg = cfg->frame_reg;
1859 ins->inst_offset = offset;
1862 if (cfg->arch.seq_point_bp_method_var) {
1865 ins = cfg->arch.seq_point_bp_method_var;
1868 offset += align - 1;
1869 offset &= ~(align - 1);
1870 ins->opcode = OP_REGOFFSET;
1871 ins->inst_basereg = cfg->frame_reg;
1872 ins->inst_offset = offset;
1876 if (cfg->has_atomic_exchange_i4 || cfg->has_atomic_cas_i4 || cfg->has_atomic_add_i4) {
1877 /* Allocate a temporary used by the atomic ops */
1881 /* Align the slot and remember its offset as the atomic temporary */
1882 offset += align - 1;
1883 offset &= ~(align - 1);
1884 cfg->arch.atomic_tmp_offset = offset;
/* -1 is stored as the offset when no such temporary is allocated. */
1887 cfg->arch.atomic_tmp_offset = -1;
/* The locals area starts here and ends at locals_max_stack_offset below. */
1890 cfg->locals_min_stack_offset = offset;
1892 curinst = cfg->locals_start;
1893 for (i = curinst; i < cfg->num_varinfo; ++i) {
1896 ins = cfg->varinfo [i];
1897 if ((ins->flags & MONO_INST_IS_DEAD) || ins->opcode == OP_REGVAR || ins->opcode == OP_REGOFFSET)
1900 t = ins->inst_vtype;
1901 if (cfg->gsharedvt && mini_is_gsharedvt_variable_type (t))
1904 /* inst->backend.is_pinvoke indicates native sized value types, this is used by the
1905 * pinvoke wrappers when they call functions returning structure */
1906 if (ins->backend.is_pinvoke && MONO_TYPE_ISSTRUCT (t) && t->type != MONO_TYPE_TYPEDBYREF) {
1907 size = mono_class_native_size (mono_class_from_mono_type (t), &ualign);
1911 size = mono_type_size (t, &align);
1913 /* FIXME: if a structure is misaligned, our memcpy doesn't work,
1914 * since it loads/stores misaligned words, which don't do the right thing.
1916 if (align < 4 && size >= 4)
1918 if (ALIGN_TO (offset, align) > ALIGN_TO (offset, 4))
1919 mini_gc_set_slot_type_from_fp (cfg, ALIGN_TO (offset, 4), SLOT_NOREF);
1920 offset += align - 1;
1921 offset &= ~(align - 1);
1922 ins->opcode = OP_REGOFFSET;
1923 ins->inst_offset = offset;
1924 ins->inst_basereg = cfg->frame_reg;
1926 //g_print ("allocating local %d to %d\n", i, inst->inst_offset);
1929 cfg->locals_max_stack_offset = offset;
1933 ins = cfg->args [curinst];
1934 if (ins->opcode != OP_REGVAR) {
1935 ins->opcode = OP_REGOFFSET;
1936 ins->inst_basereg = cfg->frame_reg;
1937 offset += sizeof (gpointer) - 1;
1938 offset &= ~(sizeof (gpointer) - 1);
1939 ins->inst_offset = offset;
1940 offset += sizeof (gpointer);
1945 if (sig->call_convention == MONO_CALL_VARARG) {
1949 /* Allocate a local slot to hold the sig cookie address */
1950 offset += align - 1;
1951 offset &= ~(align - 1);
1952 cfg->sig_cookie = offset;
/* Give every declared parameter its place in the frame. */
1956 for (i = 0; i < sig->param_count; ++i) {
1957 ainfo = cinfo->args + i;
1959 ins = cfg->args [curinst];
1961 switch (ainfo->storage) {
1963 offset = ALIGN_TO (offset, 8);
1964 ins->opcode = OP_REGOFFSET;
1965 ins->inst_basereg = cfg->frame_reg;
1966 /* These arguments are saved to the stack in the prolog */
1967 ins->inst_offset = offset;
1968 if (cfg->verbose_level >= 2)
1969 g_print ("arg %d allocated to %s+0x%0x.\n", i, mono_arch_regname (ins->inst_basereg), (int)ins->inst_offset);
/* Arguments that were not assigned to a register get a stack slot. */
1977 if (ins->opcode != OP_REGVAR) {
1978 ins->opcode = OP_REGOFFSET;
1979 ins->inst_basereg = cfg->frame_reg;
1980 size = mini_type_stack_size_full (sig->params [i], &ualign, sig->pinvoke);
1982 /* FIXME: if a structure is misaligned, our memcpy doesn't work,
1983 * since it loads/stores misaligned words, which don't do the right thing.
1985 if (align < 4 && size >= 4)
1987 /* The code in the prolog () stores words when storing vtypes received in a register */
1988 if (MONO_TYPE_ISSTRUCT (sig->params [i]))
1990 if (ALIGN_TO (offset, align) > ALIGN_TO (offset, 4))
1991 mini_gc_set_slot_type_from_fp (cfg, ALIGN_TO (offset, 4), SLOT_NOREF);
1992 offset += align - 1;
1993 offset &= ~(align - 1);
1994 ins->inst_offset = offset;
2000 /* align the offset to 8 bytes */
2001 if (ALIGN_TO (offset, 8) > ALIGN_TO (offset, 4))
2002 mini_gc_set_slot_type_from_fp (cfg, ALIGN_TO (offset, 4), SLOT_NOREF);
/* Record where the allocation ended. */
2007 cfg->stack_offset = offset;
/*
 * Creates the architecture specific variables of the method being compiled.
 * The call info is created from cfg->mempool and cached in cfg->arch.cinfo
 * if needed. The function then creates:
 *  - with hard float, two volatile locals of type double that are stored in
 *    cfg->arch.vfp_scratch_slots;
 *  - for RegTypeStructByAddr returns, the cfg->vret_addr argument variable
 *    (for RegTypeStructByVal returns only cfg->ret_var_is_local is set);
 *  - when cfg->gen_sdb_seq_points is set, the volatile native-int locals
 *    used by the sequence point code (seq_point_info_var,
 *    ss_trigger_page_var, seq_point_ss_method_var, seq_point_bp_method_var),
 *    depending on cfg->compile_aot and cfg->soft_breakpoints.
 */
2011 mono_arch_create_vars (MonoCompile *cfg)
2013 MonoMethodSignature *sig;
2017 sig = mono_method_signature (cfg->method);
2019 if (!cfg->arch.cinfo)
2020 cfg->arch.cinfo = get_call_info (cfg->mempool, sig);
2021 cinfo = cfg->arch.cinfo;
2023 if (IS_HARD_FLOAT) {
/* Two scratch slots; volatile keeps them out of registers. */
2024 for (i = 0; i < 2; i++) {
2025 MonoInst *inst = mono_compile_create_var (cfg, &mono_defaults.double_class->byval_arg, OP_LOCAL);
2026 inst->flags |= MONO_INST_VOLATILE;
2028 cfg->arch.vfp_scratch_slots [i] = (gpointer) inst;
2032 if (cinfo->ret.storage == RegTypeStructByVal)
2033 cfg->ret_var_is_local = TRUE;
/* A struct returned by address needs a variable for the hidden address argument. */
2035 if (cinfo->ret.storage == RegTypeStructByAddr) {
2036 cfg->vret_addr = mono_compile_create_var (cfg, &mono_defaults.int_class->byval_arg, OP_ARG);
2037 if (G_UNLIKELY (cfg->verbose_level > 1)) {
2038 g_print ("vret_addr = ");
2039 mono_print_ins (cfg->vret_addr);
/* Variables used by the sequence point code of the soft debugger. */
2043 if (cfg->gen_sdb_seq_points) {
2044 if (cfg->compile_aot) {
2045 MonoInst *ins = mono_compile_create_var (cfg, &mono_defaults.int_class->byval_arg, OP_LOCAL);
2046 ins->flags |= MONO_INST_VOLATILE;
2047 cfg->arch.seq_point_info_var = ins;
2049 if (!cfg->soft_breakpoints) {
2050 /* Allocate a separate variable for this to save 1 load per seq point */
2051 ins = mono_compile_create_var (cfg, &mono_defaults.int_class->byval_arg, OP_LOCAL);
2052 ins->flags |= MONO_INST_VOLATILE;
2053 cfg->arch.ss_trigger_page_var = ins;
2056 if (cfg->soft_breakpoints) {
2059 ins = mono_compile_create_var (cfg, &mono_defaults.int_class->byval_arg, OP_LOCAL);
2060 ins->flags |= MONO_INST_VOLATILE;
2061 cfg->arch.seq_point_ss_method_var = ins;
2063 ins = mono_compile_create_var (cfg, &mono_defaults.int_class->byval_arg, OP_LOCAL);
2064 ins->flags |= MONO_INST_VOLATILE;
2065 cfg->arch.seq_point_bp_method_var = ins;
/*
 * emit_sig_cookie:
 *
 *   Emit the IR that stores the signature cookie of the vararg call CALL to
 * the outgoing stack slot at ARMREG_SP + cinfo->sig_cookie.offset. The cookie
 * slot is asserted to be of storage RegTypeBase. The signature that is stored
 * is a duplicate of call->signature which only keeps the parameters from
 * sentinelpos onwards and has its own sentinelpos reset to 0.
 */
2071 emit_sig_cookie (MonoCompile *cfg, MonoCallInst *call, CallInfo *cinfo)
2073 MonoMethodSignature *tmp_sig;
2076 if (call->tail_call)
2079 g_assert (cinfo->sig_cookie.storage == RegTypeBase);
2082 * mono_ArgIterator_Setup assumes the signature cookie is
2083 * passed first and all the arguments which were before it are
2084 * passed on the stack after the signature. So compensate by
2085 * passing a different signature.
/* Drop the first sentinelpos parameters from the duplicated signature. */
2087 tmp_sig = mono_metadata_signature_dup (call->signature);
2088 tmp_sig->param_count -= call->signature->sentinelpos;
2089 tmp_sig->sentinelpos = 0;
2090 memcpy (tmp_sig->params, call->signature->params + call->signature->sentinelpos, tmp_sig->param_count * sizeof (MonoType*));
/* Materialize the signature in a vreg and store it to the cookie slot. */
2092 sig_reg = mono_alloc_ireg (cfg);
2093 MONO_EMIT_NEW_SIGNATURECONST (cfg, sig_reg, tmp_sig);
2095 MONO_EMIT_NEW_STORE_MEMBASE (cfg, OP_STORE_MEMBASE_REG, ARMREG_SP, cinfo->sig_cookie.offset, sig_reg);
/*
 * mono_arch_get_llvm_call_info:
 *
 *   Translate the calling convention of SIG into an LLVMCallInfo. Both the
 * CallInfo and the result are allocated from cfg->mempool; the result has
 * room for one LLVMArgInfo per argument, the implicit this included. The
 * return storage and the storage of every argument are mapped to their
 * LLVMArg* counterparts. For a storage kind without a mapping,
 * cfg->exception_message is set and cfg->disable_llvm becomes TRUE.
 */
2100 mono_arch_get_llvm_call_info (MonoCompile *cfg, MonoMethodSignature *sig)
2105 LLVMCallInfo *linfo;
2107 n = sig->param_count + sig->hasthis;
2109 cinfo = get_call_info (cfg->mempool, sig);
/* Zeroed block: the header followed by n argument descriptors. */
2111 linfo = mono_mempool_alloc0 (cfg->mempool, sizeof (LLVMCallInfo) + (sizeof (LLVMArgInfo) * n));
2114 * LLVM always uses the native ABI while we use our own ABI, the
2115 * only difference is the handling of vtypes:
2116 * - we only pass/receive them in registers in some cases, and only
2117 * in 1 or 2 integer registers.
/* Map the return convention. */
2119 switch (cinfo->ret.storage) {
2120 case RegTypeGeneral:
2123 case RegTypeIRegPair:
2125 case RegTypeStructByAddr:
2126 /* Vtype returned using a hidden argument */
2127 linfo->ret.storage = LLVMArgVtypeRetAddr;
2128 linfo->vret_arg_index = cinfo->vret_arg_index;
2131 case RegTypeStructByVal:
2132 /* LLVM models this by returning an int array */
2133 linfo->ret.storage = LLVMArgAsIArgs;
2134 linfo->ret.nslots = cinfo->ret.nregs;
2138 linfo->ret.storage = LLVMArgFpStruct;
2139 linfo->ret.nslots = cinfo->ret.nregs;
2140 linfo->ret.esize = cinfo->ret.esize;
2143 cfg->exception_message = g_strdup_printf ("unknown ret conv (%d)", cinfo->ret.storage);
2144 cfg->disable_llvm = TRUE;
/* Map the convention of each argument. */
2148 for (i = 0; i < n; ++i) {
2149 LLVMArgInfo *lainfo = &linfo->args [i];
2150 ainfo = cinfo->args + i;
2152 lainfo->storage = LLVMArgNone;
2154 switch (ainfo->storage) {
2155 case RegTypeGeneral:
2156 case RegTypeIRegPair:
2158 case RegTypeBaseGen:
2160 lainfo->storage = LLVMArgNormal;
2162 case RegTypeStructByVal:
2163 lainfo->storage = LLVMArgAsIArgs;
2164 if (eabi_supported && ainfo->align == 8) {
2165 /* LLVM models this by passing an int64 array */
2166 lainfo->nslots = ALIGN_TO (ainfo->struct_size, 8) / 8;
/* Here the slot count is struct_size divided by the pointer size. */
2169 lainfo->nslots = ainfo->struct_size / sizeof (gpointer);
2173 case RegTypeStructByAddr:
2174 case RegTypeStructByAddrOnStack:
2175 lainfo->storage = LLVMArgVtypeByRef;
/* FP aggregate: every one of the nregs slots is marked as an FP register. */
2180 lainfo->storage = LLVMArgAsFpArgs;
2181 lainfo->nslots = ainfo->nregs;
2182 lainfo->esize = ainfo->esize;
2183 for (j = 0; j < ainfo->nregs; ++j)
2184 lainfo->pair_storage [j] = LLVMArgInFPReg;
2188 cfg->exception_message = g_strdup_printf ("ainfo->storage (%d)", ainfo->storage);
2189 cfg->disable_llvm = TRUE;
/*
 * mono_arch_emit_call:
 *
 *   Emit the IR which places the arguments of CALL according to the call info
 * computed for call->signature (allocated from cfg->mempool).
 * The return convention is handled first: a vtype returned in a single
 * register sets call->vret_in_reg, other vtypes returned in registers have
 * the address of the return area saved in cfg->arch.vret_addr_loc, and for
 * RegTypeStructByAddr the address is passed in cinfo->ret.reg.
 * Each argument is then moved to its register, stored to its stack slot
 * relative to ARMREG_SP, or wrapped in an OP_OUTARG_VT instruction which
 * carries a copy of its ArgInfo. The signature cookie of vararg calls is
 * emitted through emit_sig_cookie (). Finally the call info and its stack
 * usage are recorded on CALL.
 */
2199 mono_arch_emit_call (MonoCompile *cfg, MonoCallInst *call)
2202 MonoMethodSignature *sig;
2206 sig = call->signature;
2207 n = sig->param_count + sig->hasthis;
2209 cinfo = get_call_info (cfg->mempool, sig);
/* Deal with the return value convention before the arguments. */
2211 switch (cinfo->ret.storage) {
2212 case RegTypeStructByVal:
2214 if (cinfo->ret.storage == RegTypeStructByVal && cinfo->ret.nregs == 1) {
2215 /* The JIT will transform this into a normal call */
2216 call->vret_in_reg = TRUE;
2219 if (call->inst.opcode == OP_TAILCALL)
2222 * The vtype is returned in registers, save the return area address in a local, and save the vtype into
2223 * the location pointed to by it after call in emit_move_return_value ().
/* The local is created on first use and shared through cfg->arch. */
2225 if (!cfg->arch.vret_addr_loc) {
2226 cfg->arch.vret_addr_loc = mono_compile_create_var (cfg, &mono_defaults.int_class->byval_arg, OP_LOCAL);
2227 /* Prevent it from being register allocated or optimized away */
2228 ((MonoInst*)cfg->arch.vret_addr_loc)->flags |= MONO_INST_VOLATILE;
2231 MONO_EMIT_NEW_UNALU (cfg, OP_MOVE, ((MonoInst*)cfg->arch.vret_addr_loc)->dreg, call->vret_var->dreg);
2233 case RegTypeStructByAddr: {
/* Copy the return area address to a fresh vreg and pass it in cinfo->ret.reg. */
2235 MONO_INST_NEW (cfg, vtarg, OP_MOVE);
2236 vtarg->sreg1 = call->vret_var->dreg;
2237 vtarg->dreg = mono_alloc_preg (cfg);
2238 MONO_ADD_INS (cfg->cbb, vtarg);
2240 mono_call_inst_add_outarg_reg (cfg, call, vtarg->dreg, cinfo->ret.reg, FALSE);
/* Place the n arguments; n includes the implicit this. */
2247 for (i = 0; i < n; ++i) {
2248 ArgInfo *ainfo = cinfo->args + i;
/* The implicit this (i < sig->hasthis) is typed as a native int. */
2251 if (i >= sig->hasthis)
2252 t = sig->params [i - sig->hasthis];
2254 t = &mono_defaults.int_class->byval_arg;
2255 t = mini_get_underlying_type (t);
2257 if ((sig->call_convention == MONO_CALL_VARARG) && (i == sig->sentinelpos)) {
2258 /* Emit the signature cookie just before the implicit arguments */
2259 emit_sig_cookie (cfg, call, cinfo);
2262 in = call->args [i];
2264 switch (ainfo->storage) {
2265 case RegTypeGeneral:
2266 case RegTypeIRegPair:
/* 64 bit integers: low word to ainfo->reg, high word to ainfo->reg + 1. */
2267 if (!t->byref && ((t->type == MONO_TYPE_I8) || (t->type == MONO_TYPE_U8))) {
2268 MONO_INST_NEW (cfg, ins, OP_MOVE);
2269 ins->dreg = mono_alloc_ireg (cfg);
2270 ins->sreg1 = MONO_LVREG_LS (in->dreg);
2271 MONO_ADD_INS (cfg->cbb, ins);
2272 mono_call_inst_add_outarg_reg (cfg, call, ins->dreg, ainfo->reg, FALSE);
2274 MONO_INST_NEW (cfg, ins, OP_MOVE);
2275 ins->dreg = mono_alloc_ireg (cfg);
2276 ins->sreg1 = MONO_LVREG_MS (in->dreg);
2277 MONO_ADD_INS (cfg->cbb, ins);
2278 mono_call_inst_add_outarg_reg (cfg, call, ins->dreg, ainfo->reg + 1, FALSE);
/* Floating point values which travel in integer registers. */
2279 } else if (!t->byref && ((t->type == MONO_TYPE_R8) || (t->type == MONO_TYPE_R4))) {
2280 if (ainfo->size == 4) {
2281 if (IS_SOFT_FLOAT) {
2282 /* mono_emit_call_args () has already done the r8->r4 conversion */
2283 /* The converted value is in an int vreg */
2284 MONO_INST_NEW (cfg, ins, OP_MOVE);
2285 ins->dreg = mono_alloc_ireg (cfg);
2286 ins->sreg1 = in->dreg;
2287 MONO_ADD_INS (cfg->cbb, ins);
2288 mono_call_inst_add_outarg_reg (cfg, call, ins->dreg, ainfo->reg, FALSE);
/* Bounce the value through the last 8 bytes of the param area to get it into an int vreg. */
2292 cfg->param_area = MAX (cfg->param_area, 8);
2293 MONO_EMIT_NEW_STORE_MEMBASE (cfg, OP_STORER4_MEMBASE_REG, ARMREG_SP, (cfg->param_area - 8), in->dreg);
2294 creg = mono_alloc_ireg (cfg);
2295 MONO_EMIT_NEW_LOAD_MEMBASE_OP (cfg, OP_LOAD_MEMBASE, creg, ARMREG_SP, (cfg->param_area - 8));
2296 mono_call_inst_add_outarg_reg (cfg, call, creg, ainfo->reg, FALSE);
2299 if (IS_SOFT_FLOAT) {
2300 MONO_INST_NEW (cfg, ins, OP_FGETLOW32);
2301 ins->dreg = mono_alloc_ireg (cfg);
2302 ins->sreg1 = in->dreg;
2303 MONO_ADD_INS (cfg->cbb, ins);
2304 mono_call_inst_add_outarg_reg (cfg, call, ins->dreg, ainfo->reg, FALSE);
2306 MONO_INST_NEW (cfg, ins, OP_FGETHIGH32);
2307 ins->dreg = mono_alloc_ireg (cfg);
2308 ins->sreg1 = in->dreg;
2309 MONO_ADD_INS (cfg->cbb, ins);
2310 mono_call_inst_add_outarg_reg (cfg, call, ins->dreg, ainfo->reg + 1, FALSE);
/* Same bounce for a double: both words are read back into two int vregs. */
2314 cfg->param_area = MAX (cfg->param_area, 8);
2315 MONO_EMIT_NEW_STORE_MEMBASE (cfg, OP_STORER8_MEMBASE_REG, ARMREG_SP, (cfg->param_area - 8), in->dreg);
2316 creg = mono_alloc_ireg (cfg);
2317 MONO_EMIT_NEW_LOAD_MEMBASE_OP (cfg, OP_LOAD_MEMBASE, creg, ARMREG_SP, (cfg->param_area - 8));
2318 mono_call_inst_add_outarg_reg (cfg, call, creg, ainfo->reg, FALSE);
2319 creg = mono_alloc_ireg (cfg);
2320 MONO_EMIT_NEW_LOAD_MEMBASE_OP (cfg, OP_LOAD_MEMBASE, creg, ARMREG_SP, (cfg->param_area - 8 + 4));
2321 mono_call_inst_add_outarg_reg (cfg, call, creg, ainfo->reg + 1, FALSE);
2324 cfg->flags |= MONO_CFG_HAS_FPOUT;
2326 MONO_INST_NEW (cfg, ins, OP_MOVE);
2327 ins->dreg = mono_alloc_ireg (cfg);
2328 ins->sreg1 = in->dreg;
2329 MONO_ADD_INS (cfg->cbb, ins);
2331 mono_call_inst_add_outarg_reg (cfg, call, ins->dreg, ainfo->reg, FALSE);
2334 case RegTypeStructByVal:
2335 case RegTypeGSharedVtInReg:
2336 case RegTypeGSharedVtOnStack:
2338 case RegTypeStructByAddr:
2339 case RegTypeStructByAddrOnStack:
/* Value types are wrapped in OP_OUTARG_VT together with a private copy of their ArgInfo. */
2340 MONO_INST_NEW (cfg, ins, OP_OUTARG_VT);
2341 ins->opcode = OP_OUTARG_VT;
2342 ins->sreg1 = in->dreg;
2343 ins->klass = in->klass;
2344 ins->inst_p0 = call;
2345 ins->inst_p1 = mono_mempool_alloc (cfg->mempool, sizeof (ArgInfo));
2346 memcpy (ins->inst_p1, ainfo, sizeof (ArgInfo));
2347 mono_call_inst_add_outarg_vt (cfg, call, ins);
2348 MONO_ADD_INS (cfg->cbb, ins);
/* Stack arguments: the store opcode is picked from the type of the value. */
2351 if (!t->byref && ((t->type == MONO_TYPE_I8) || (t->type == MONO_TYPE_U8))) {
2352 MONO_EMIT_NEW_STORE_MEMBASE (cfg, OP_STOREI8_MEMBASE_REG, ARMREG_SP, ainfo->offset, in->dreg);
2353 } else if (!t->byref && ((t->type == MONO_TYPE_R4) || (t->type == MONO_TYPE_R8))) {
2354 if (t->type == MONO_TYPE_R8) {
2355 MONO_EMIT_NEW_STORE_MEMBASE (cfg, OP_STORER8_MEMBASE_REG, ARMREG_SP, ainfo->offset, in->dreg);
2358 MONO_EMIT_NEW_STORE_MEMBASE (cfg, OP_STOREI4_MEMBASE_REG, ARMREG_SP, ainfo->offset, in->dreg);
2360 MONO_EMIT_NEW_STORE_MEMBASE (cfg, OP_STORER4_MEMBASE_REG, ARMREG_SP, ainfo->offset, in->dreg);
2363 MONO_EMIT_NEW_STORE_MEMBASE (cfg, OP_STORE_MEMBASE_REG, ARMREG_SP, ainfo->offset, in->dreg);
2366 case RegTypeBaseGen:
/* Split argument: one word goes to r3, the other to the stack slot at ainfo->offset. */
2367 if (!t->byref && ((t->type == MONO_TYPE_I8) || (t->type == MONO_TYPE_U8))) {
2368 MONO_EMIT_NEW_STORE_MEMBASE (cfg, OP_STORE_MEMBASE_REG, ARMREG_SP, ainfo->offset, (G_BYTE_ORDER == G_BIG_ENDIAN) ? MONO_LVREG_LS (in->dreg) : MONO_LVREG_MS (in->dreg));
2369 MONO_INST_NEW (cfg, ins, OP_MOVE);
2370 ins->dreg = mono_alloc_ireg (cfg);
2371 ins->sreg1 = G_BYTE_ORDER == G_BIG_ENDIAN ? MONO_LVREG_MS (in->dreg) : MONO_LVREG_LS (in->dreg);
2372 MONO_ADD_INS (cfg->cbb, ins);
2373 mono_call_inst_add_outarg_reg (cfg, call, ins->dreg, ARMREG_R3, FALSE);
2374 } else if (!t->byref && (t->type == MONO_TYPE_R8)) {
2377 /* This should work for soft-float as well */
2379 cfg->param_area = MAX (cfg->param_area, 8);
2380 MONO_EMIT_NEW_STORE_MEMBASE (cfg, OP_STORER8_MEMBASE_REG, ARMREG_SP, (cfg->param_area - 8), in->dreg);
2381 creg = mono_alloc_ireg (cfg);
2382 mono_call_inst_add_outarg_reg (cfg, call, creg, ARMREG_R3, FALSE);
2383 MONO_EMIT_NEW_LOAD_MEMBASE_OP (cfg, OP_LOAD_MEMBASE, creg, ARMREG_SP, (cfg->param_area - 8));
2384 creg = mono_alloc_ireg (cfg);
2385 MONO_EMIT_NEW_LOAD_MEMBASE_OP (cfg, OP_LOAD_MEMBASE, creg, ARMREG_SP, (cfg->param_area - 4));
2386 MONO_EMIT_NEW_STORE_MEMBASE (cfg, OP_STORE_MEMBASE_REG, ARMREG_SP, ainfo->offset, creg);
2387 cfg->flags |= MONO_CFG_HAS_FPOUT;
2389 g_assert_not_reached ();
2393 int fdreg = mono_alloc_freg (cfg);
2395 if (ainfo->size == 8) {
2396 MONO_INST_NEW (cfg, ins, OP_FMOVE);
2397 ins->sreg1 = in->dreg;
2399 MONO_ADD_INS (cfg->cbb, ins);
2401 mono_call_inst_add_outarg_reg (cfg, call, ins->dreg, ainfo->reg, TRUE);
2406 * Mono's register allocator doesn't speak single-precision registers that
2407 * overlap double-precision registers (i.e. armhf). So we have to work around
2408 * the register allocator and load the value from memory manually.
2410 * So we create a variable for the float argument and an instruction to store
2411 * the argument into the variable. We then store the list of these arguments
2412 * in call->float_args. This list is then used by emit_float_args later to
2413 * pass the arguments in the various call opcodes.
2415 * This is not very nice, and we should really try to fix the allocator.
2418 MonoInst *float_arg = mono_compile_create_var (cfg, &mono_defaults.single_class->byval_arg, OP_LOCAL);
2420 /* Make sure the instruction isn't seen as pointless and removed.
2422 float_arg->flags |= MONO_INST_VOLATILE;
2424 MONO_EMIT_NEW_UNALU (cfg, OP_FMOVE, float_arg->dreg, in->dreg);
2426 /* We use the dreg to look up the instruction later. The hreg is used to
2427 * emit the instruction that loads the value into the FP reg.
2429 fad = mono_mempool_alloc0 (cfg->mempool, sizeof (FloatArgData));
2430 fad->vreg = float_arg->dreg;
2431 fad->hreg = ainfo->reg;
2433 call->float_args = g_slist_append_mempool (cfg->mempool, call->float_args, fad);
2436 call->used_iregs |= 1 << ainfo->reg;
2437 cfg->flags |= MONO_CFG_HAS_FPOUT;
2441 g_assert_not_reached ();
2445 /* Handle the case where there are no implicit arguments */
2446 if (!sig->pinvoke && (sig->call_convention == MONO_CALL_VARARG) && (n == sig->sentinelpos))
2447 emit_sig_cookie (cfg, call, cinfo);
/* Keep the call info and its stack usage on the call instruction. */
2449 call->call_info = cinfo;
2450 call->stack_usage = cinfo->stack_usage;
/*
 * add_outarg_reg:
 *
 *   Bind the value of ARG to the hardware register REG for CALL. The visible
 * path copies ARG with OP_FMOVE into a freshly allocated float vreg and
 * registers that vreg as a floating point out argument (last argument TRUE).
 * NOTE(review): the dispatch on STORAGE is not visible here; the
 * g_assert_not_reached () presumably covers unhandled storage kinds - confirm.
 */
2454 add_outarg_reg (MonoCompile *cfg, MonoCallInst *call, ArgStorage storage, int reg, MonoInst *arg)
2460 MONO_INST_NEW (cfg, ins, OP_FMOVE);
2461 ins->dreg = mono_alloc_freg (cfg);
2462 ins->sreg1 = arg->dreg;
2463 MONO_ADD_INS (cfg->cbb, ins);
2464 mono_call_inst_add_outarg_reg (cfg, call, ins->dreg, reg, TRUE);
2467 g_assert_not_reached ();
/*
 * mono_arch_emit_outarg_vt:
 *
 *   Expand the OP_OUTARG_VT instruction INS. The call is taken from
 * ins->inst_p0 and the ArgInfo describing the argument from ins->inst_p1;
 * SRC holds the address of the value type. Depending on ainfo->storage the
 * argument is passed
 *  - by address in ainfo->reg,
 *  - by address in the stack slot at ARMREG_SP + ainfo->offset,
 *  - as ainfo->nregs floating point elements of ainfo->esize bytes each, or
 *  - by value: ainfo->size words are loaded into consecutive integer
 *    registers starting at ainfo->reg and the rest is copied to the stack at
 *    ARMREG_SP + ainfo->offset.
 */
2473 mono_arch_emit_outarg_vt (MonoCompile *cfg, MonoInst *ins, MonoInst *src)
2475 MonoCallInst *call = (MonoCallInst*)ins->inst_p0;
2477 ArgInfo *ainfo = ins->inst_p1;
2478 int ovf_size = ainfo->vtsize;
2479 int doffset = ainfo->offset;
2480 int struct_size = ainfo->struct_size;
2481 int i, soffset, dreg, tmpreg;
2483 switch (ainfo->storage) {
2484 case RegTypeGSharedVtInReg:
2485 case RegTypeStructByAddr:
2487 mono_call_inst_add_outarg_reg (cfg, call, src->dreg, ainfo->reg, FALSE);
2489 case RegTypeGSharedVtOnStack:
2490 case RegTypeStructByAddrOnStack:
2491 /* Pass by addr on stack */
2492 MONO_EMIT_NEW_STORE_MEMBASE (cfg, OP_STORE_MEMBASE_REG, ARMREG_SP, ainfo->offset, src->dreg);
/* One load per element; element i is read from offset i * esize. */
2495 for (i = 0; i < ainfo->nregs; ++i) {
2496 if (ainfo->esize == 4)
2497 MONO_INST_NEW (cfg, load, OP_LOADR4_MEMBASE);
2499 MONO_INST_NEW (cfg, load, OP_LOADR8_MEMBASE);
2500 load->dreg = mono_alloc_freg (cfg);
2501 load->inst_basereg = src->dreg;
2502 load->inst_offset = i * ainfo->esize;
2503 MONO_ADD_INS (cfg->cbb, load);
/* 4 byte elements go through call->float_args; the others are passed in register ainfo->reg + 2 * i. */
2505 if (ainfo->esize == 4) {
2508 /* See RegTypeFP in mono_arch_emit_call () */
2509 MonoInst *float_arg = mono_compile_create_var (cfg, &mono_defaults.single_class->byval_arg, OP_LOCAL);
2510 float_arg->flags |= MONO_INST_VOLATILE;
2511 MONO_EMIT_NEW_UNALU (cfg, OP_FMOVE, float_arg->dreg, load->dreg);
2513 fad = mono_mempool_alloc0 (cfg->mempool, sizeof (FloatArgData));
2514 fad->vreg = float_arg->dreg;
2515 fad->hreg = ainfo->reg + i;
2517 call->float_args = g_slist_append_mempool (cfg->mempool, call->float_args, fad);
2519 add_outarg_reg (cfg, call, RegTypeFP, ainfo->reg + (i * 2), load);
/* Part passed in integer registers: one word per register, sized by what is left of the struct. */
2525 for (i = 0; i < ainfo->size; ++i) {
2526 dreg = mono_alloc_ireg (cfg);
2527 switch (struct_size) {
2529 MONO_EMIT_NEW_LOAD_MEMBASE_OP (cfg, OP_LOADU1_MEMBASE, dreg, src->dreg, soffset);
2532 MONO_EMIT_NEW_LOAD_MEMBASE_OP (cfg, OP_LOADU2_MEMBASE, dreg, src->dreg, soffset);
/* Assemble three bytes: byte 0 | byte 1 << 8 | byte 2 << 16. */
2535 tmpreg = mono_alloc_ireg (cfg);
2536 MONO_EMIT_NEW_LOAD_MEMBASE_OP (cfg, OP_LOADU1_MEMBASE, dreg, src->dreg, soffset);
2537 MONO_EMIT_NEW_LOAD_MEMBASE_OP (cfg, OP_LOADU1_MEMBASE, tmpreg, src->dreg, soffset + 1);
2538 MONO_EMIT_NEW_BIALU_IMM (cfg, OP_SHL_IMM, tmpreg, tmpreg, 8);
2539 MONO_EMIT_NEW_BIALU (cfg, OP_IOR, dreg, dreg, tmpreg);
2540 MONO_EMIT_NEW_LOAD_MEMBASE_OP (cfg, OP_LOADU1_MEMBASE, tmpreg, src->dreg, soffset + 2);
2541 MONO_EMIT_NEW_BIALU_IMM (cfg, OP_SHL_IMM, tmpreg, tmpreg, 16);
2542 MONO_EMIT_NEW_BIALU (cfg, OP_IOR, dreg, dreg, tmpreg);
2545 MONO_EMIT_NEW_LOAD_MEMBASE (cfg, dreg, src->dreg, soffset);
2548 mono_call_inst_add_outarg_reg (cfg, call, dreg, ainfo->reg + i, FALSE);
2549 soffset += sizeof (gpointer);
2550 struct_size -= sizeof (gpointer);
2552 //g_print ("vt size: %d at R%d + %d\n", doffset, vt->inst_basereg, vt->inst_offset);
/* Copy the overflow part, at most ovf_size words and no more than what is left, to the stack. */
2554 mini_emit_memcpy (cfg, ARMREG_SP, doffset, src->dreg, soffset, MIN (ovf_size * sizeof (gpointer), struct_size), struct_size < 4 ? 1 : 4);
/*
 * mono_arch_emit_setret:
 *
 *   Emit the IR which moves VAL into the return location of METHOD. The
 * choice depends on the underlying return type:
 *  - I8/U8: a plain OP_MOVE when compiling with LLVM, an OP_SETLRET fed with
 *    the two halves of the long vreg in the other visible path;
 *  - R4/R8: handled per FPU mode, either with OP_SETFRET or, for R4 under
 *    MONO_ARM_FPU_NONE, with an integer OP_MOVE;
 *  - the OP_MOVE at the end moves VAL into cfg->ret->dreg.
 */
2560 mono_arch_emit_setret (MonoCompile *cfg, MonoMethod *method, MonoInst *val)
2562 MonoType *ret = mini_get_underlying_type (mono_method_signature (method)->ret);
/* 64 bit integer results. */
2565 if (ret->type == MONO_TYPE_I8 || ret->type == MONO_TYPE_U8) {
2568 if (COMPILE_LLVM (cfg)) {
2569 MONO_EMIT_NEW_UNALU (cfg, OP_MOVE, cfg->ret->dreg, val->dreg);
2571 MONO_INST_NEW (cfg, ins, OP_SETLRET);
2572 ins->sreg1 = MONO_LVREG_LS (val->dreg);
2573 ins->sreg2 = MONO_LVREG_MS (val->dreg);
2574 MONO_ADD_INS (cfg->cbb, ins);
/* Floating point results, by FPU mode. */
2579 case MONO_ARM_FPU_NONE:
2580 if (ret->type == MONO_TYPE_R8) {
2583 MONO_INST_NEW (cfg, ins, OP_SETFRET);
2584 ins->dreg = cfg->ret->dreg;
2585 ins->sreg1 = val->dreg;
2586 MONO_ADD_INS (cfg->cbb, ins);
2589 if (ret->type == MONO_TYPE_R4) {
2590 /* Already converted to an int in method_to_ir () */
2591 MONO_EMIT_NEW_UNALU (cfg, OP_MOVE, cfg->ret->dreg, val->dreg);
2595 case MONO_ARM_FPU_VFP:
2596 case MONO_ARM_FPU_VFP_HARD:
2597 if (ret->type == MONO_TYPE_R8 || ret->type == MONO_TYPE_R4) {
2600 MONO_INST_NEW (cfg, ins, OP_SETFRET);
2601 ins->dreg = cfg->ret->dreg;
2602 ins->sreg1 = val->dreg;
2603 MONO_ADD_INS (cfg->cbb, ins);
2608 g_assert_not_reached ();
/* Plain move of VAL into the return vreg. */
2612 MONO_EMIT_NEW_UNALU (cfg, OP_MOVE, cfg->ret->dreg, val->dreg);
2615 #endif /* #ifndef DISABLE_JIT */
2618 mono_arch_is_inst_imm (gint64 imm)
2624 MonoMethodSignature *sig;
2627 MonoType **param_types;
// dyn_call_supported:
//
//   Check whether a signature with calling convention info CINFO can be
// handled by the dynamic call code in this file. The visible checks bound the
// number of arguments by PARAM_REGS + DYN_CALL_STACK_ARGS and inspect the
// storage class of the return value and of every argument.
// NOTE: the return statements are on lines omitted from this listing.
2631 dyn_call_supported (CallInfo *cinfo, MonoMethodSignature *sig)
2635 if (sig->hasthis + sig->param_count > PARAM_REGS + DYN_CALL_STACK_ARGS)
2638 switch (cinfo->ret.storage) {
2640 case RegTypeGeneral:
2641 case RegTypeIRegPair:
2642 case RegTypeStructByAddr:
2653 for (i = 0; i < cinfo->nargs; ++i) {
2654 ArgInfo *ainfo = &cinfo->args [i];
2657 switch (ainfo->storage) {
2658 case RegTypeGeneral:
2659 case RegTypeIRegPair:
2660 case RegTypeBaseGen:
// Stack arguments are compared against the DYN_CALL_STACK_ARGS slots, in bytes.
2664 if (ainfo->offset >= (DYN_CALL_STACK_ARGS * sizeof (gpointer)))
// Value types: last_slot is the slot index one past the end of the struct,
// counted from the stack offset when size is 0 and from ainfo->reg otherwise.
2667 case RegTypeStructByVal:
2668 if (ainfo->size == 0)
2669 last_slot = PARAM_REGS + (ainfo->offset / 4) + ainfo->vtsize;
2671 last_slot = ainfo->reg + ainfo->size + ainfo->vtsize;
2672 if (last_slot >= PARAM_REGS + DYN_CALL_STACK_ARGS)
2680 // FIXME: Can't use cinfo only as it doesn't contain info about I8/float */
// Second pass over the managed parameter types (not over cinfo).
2681 for (i = 0; i < sig->param_count; ++i) {
2682 MonoType *t = sig->params [i];
2687 t = mini_get_underlying_type (t);
// mono_arch_dyn_call_prepare:
//
//   Build the per-signature data used by the dynamic call entry points.
// Computes the call info for SIG, checks it with dyn_call_supported (), then
// allocates an ArchDynCallInfo holding the call info, the underlying return
// type and an array with the underlying type of every parameter.
// Returns the new structure cast to MonoDynCallInfo*.
// NOTE: the handling of the unsupported case is on lines omitted here.
2710 mono_arch_dyn_call_prepare (MonoMethodSignature *sig)
2712 ArchDynCallInfo *info;
2716 cinfo = get_call_info (NULL, sig);
2718 if (!dyn_call_supported (cinfo, sig)) {
2723 info = g_new0 (ArchDynCallInfo, 1);
2724 // FIXME: Preprocess the info to speed up start_dyn_call ()
2726 info->cinfo = cinfo;
2727 info->rtype = mini_get_underlying_type (sig->ret);
// param_types is a separate heap array with one entry per signature parameter.
2728 info->param_types = g_new0 (MonoType*, sig->param_count);
2729 for (i = 0; i < sig->param_count; ++i)
2730 info->param_types [i] = mini_get_underlying_type (sig->params [i]);
2732 return (MonoDynCallInfo*)info;
// mono_arch_dyn_call_free:
//
//   Release the data created by mono_arch_dyn_call_prepare ().
// NOTE(review): only the release of ainfo->cinfo is visible in this listing;
// the param_types array allocated in mono_arch_dyn_call_prepare () has no
// visible g_free () here. Confirm against the full file that it is released.
2736 mono_arch_dyn_call_free (MonoDynCallInfo *info)
2738 ArchDynCallInfo *ainfo = (ArchDynCallInfo*)info;
2740 g_free (ainfo->cinfo);
// mono_arch_start_dyn_call:
//
//   Marshal the arguments in ARGS into the DynCallArgs structure that lives
// in BUF, following the per-argument storage recorded in the call info of
// INFO. BUF_LEN must be at least sizeof (DynCallArgs) (asserted below).
// Integer-like values are written to p->regs, hard-float values to p->fpregs.
// NOTE: this listing omits short lines (case labels, braces, break), so the
// grouping of the stores below under their type cases is not fully visible.
2745 mono_arch_start_dyn_call (MonoDynCallInfo *info, gpointer **args, guint8 *ret, guint8 *buf, int buf_len)
2747 ArchDynCallInfo *dinfo = (ArchDynCallInfo*)info;
2748 DynCallArgs *p = (DynCallArgs*)buf;
2749 int arg_index, greg, i, j, pindex;
2750 MonoMethodSignature *sig = dinfo->sig;
2752 g_assert (buf_len >= sizeof (DynCallArgs));
// The first incoming argument is consumed here when the method has a this
// pointer or when the vret argument is at index 1.
2762 if (sig->hasthis || dinfo->cinfo->vret_arg_index == 1) {
2763 p->regs [greg ++] = (mgreg_t)*(args [arg_index ++]);
// A struct returned by address takes the next integer register for RET.
2768 if (dinfo->cinfo->ret.storage == RegTypeStructByAddr)
2769 p->regs [greg ++] = (mgreg_t)ret;
2771 for (i = pindex; i < sig->param_count; i++) {
2772 MonoType *t = dinfo->param_types [i];
2773 gpointer *arg = args [arg_index ++];
// cinfo->args is indexed with the this argument included, hence the offset.
2774 ArgInfo *ainfo = &dinfo->cinfo->args [i + sig->hasthis];
2777 if (ainfo->storage == RegTypeGeneral || ainfo->storage == RegTypeIRegPair || ainfo->storage == RegTypeStructByVal) {
2779 } else if (ainfo->storage == RegTypeFP) {
2780 } else if (ainfo->storage == RegTypeBase) {
// Stack slots are numbered after the PARAM_REGS register slots, 4 bytes each.
2781 slot = PARAM_REGS + (ainfo->offset / 4);
2782 } else if (ainfo->storage == RegTypeBaseGen) {
2783 /* slot + 1 is the first stack slot, so the code below will work */
2786 g_assert_not_reached ();
2790 p->regs [slot] = (mgreg_t)*arg;
2795 case MONO_TYPE_OBJECT:
2799 p->regs [slot] = (mgreg_t)*arg;
2802 p->regs [slot] = *(guint8*)arg;
2805 p->regs [slot] = *(gint8*)arg;
2808 p->regs [slot] = *(gint16*)arg;
2811 p->regs [slot] = *(guint16*)arg;
2814 p->regs [slot] = *(gint32*)arg;
2817 p->regs [slot] = *(guint32*)arg;
// Two-word values occupy two consecutive slots.
2821 p->regs [slot ++] = (mgreg_t)arg [0];
2822 p->regs [slot] = (mgreg_t)arg [1];
2825 if (ainfo->storage == RegTypeFP) {
2826 float f = *(float*)arg;
// NOTE(review): this reads a double-sized object through the address of the
// float local f, i.e. more bytes than f holds. Confirm this is intended.
2827 p->fpregs [ainfo->reg / 2] = *(double*)&f;
2830 p->regs [slot] = *(mgreg_t*)arg;
2834 if (ainfo->storage == RegTypeFP) {
2835 p->fpregs [ainfo->reg / 2] = *(double*)arg;
2838 p->regs [slot ++] = (mgreg_t)arg [0];
2839 p->regs [slot] = (mgreg_t)arg [1];
2842 case MONO_TYPE_GENERICINST:
2843 if (MONO_TYPE_IS_REFERENCE (t)) {
2844 p->regs [slot] = (mgreg_t)*arg;
2847 if (t->type == MONO_TYPE_GENERICINST && mono_class_is_nullable (mono_class_from_mono_type (t))) {
2848 MonoClass *klass = mono_class_from_mono_type (t);
2849 guint8 *nullable_buf;
// Nullable arguments are materialised into a g_alloca () buffer of the value
// size of the class, and ARG is redirected to that buffer.
2852 size = mono_class_value_size (klass, NULL);
2853 nullable_buf = g_alloca (size);
2854 g_assert (nullable_buf);
2856 /* The argument pointed to by arg is either a boxed vtype or null */
2857 mono_nullable_init (nullable_buf, (MonoObject*)arg, klass);
2859 arg = (gpointer*)nullable_buf;
2865 case MONO_TYPE_VALUETYPE:
2866 g_assert (ainfo->storage == RegTypeStructByVal);
2868 if (ainfo->size == 0)
2869 slot = PARAM_REGS + (ainfo->offset / 4);
// Copy the struct word by word: size register words plus vtsize stack words.
2873 for (j = 0; j < ainfo->size + ainfo->vtsize; ++j)
2874 p->regs [slot ++] = ((mgreg_t*)arg) [j];
2877 g_assert_not_reached ();
// mono_arch_finish_dyn_call:
//
//   Store the result of a dynamic call into the return buffer. BUF holds the
// DynCallArgs structure; its res and res2 fields carry the integer result
// words, fpregs [0] carries the hard-float result and p->ret points at the
// destination. The store width is selected by the underlying return type
// saved in the ArchDynCallInfo.
// NOTE: this listing omits short lines (case labels, braces, break).
2883 mono_arch_finish_dyn_call (MonoDynCallInfo *info, guint8 *buf)
2885 ArchDynCallInfo *ainfo = (ArchDynCallInfo*)info;
2886 DynCallArgs *p = (DynCallArgs*)buf;
2887 MonoType *ptype = ainfo->rtype;
2888 guint8 *ret = p->ret;
2889 mgreg_t res = p->res;
2890 mgreg_t res2 = p->res2;
2892 switch (ptype->type) {
2893 case MONO_TYPE_VOID:
2894 *(gpointer*)ret = NULL;
2896 case MONO_TYPE_OBJECT:
2900 *(gpointer*)ret = (gpointer)res;
2906 *(guint8*)ret = res;
2909 *(gint16*)ret = res;
2912 *(guint16*)ret = res;
2915 *(gint32*)ret = res;
2918 *(guint32*)ret = res;
2922 /* This handles endianness as well */
2923 ((gint32*)ret) [0] = res;
2924 ((gint32*)ret) [1] = res2;
2926 case MONO_TYPE_GENERICINST:
2927 if (MONO_TYPE_IS_REFERENCE (ptype)) {
2928 *(gpointer*)ret = (gpointer)res;
// Value types must have been returned through a hidden address argument, so
// there is nothing to copy here beyond the assertion.
2933 case MONO_TYPE_VALUETYPE:
2934 g_assert (ainfo->cinfo->ret.storage == RegTypeStructByAddr);
// R4: taken from fpregs [0] on one path and from the integer result on the other.
2940 *(float*)ret = *(float*)&p->fpregs [0];
2942 *(float*)ret = *(float*)&res;
2944 case MONO_TYPE_R8: {
2948 if (IS_HARD_FLOAT) {
2949 *(double*)ret = p->fpregs [0];
// Soft ABI: reinterpret the two result words as one double. The operand was
// a mis-encoded address-of expression and is restored to &regs here; regs is
// presumably the local word pair filled from res and res2 on omitted lines.
2954 *(double*)ret = *(double*)&regs;
2959 g_assert_not_reached ();
2966 * Allow tracing to work with this interface (with an optional argument)
// mono_arch_instrument_prolog:
//
//   Emit a call to FUNC at method entry: R0 is loaded with cfg->method, R1
// with 0, and FUNC is called through R2.
// NOTE: the declaration of code and the return statement are on lines
// omitted from this listing.
2970 mono_arch_instrument_prolog (MonoCompile *cfg, void *func, void *p, gboolean enable_arguments)
2974 code = mono_arm_emit_load_imm (code, ARMREG_R0, (guint32)cfg->method);
2975 ARM_MOV_REG_IMM8 (code, ARMREG_R1, 0); /* NULL ebp for now */
2976 code = mono_arm_emit_load_imm (code, ARMREG_R2, (guint32)func);
2977 code = emit_call_reg (code, ARMREG_R2);
// mono_arch_instrument_epilog_full:
//
//   Emit a call to FUNC at method exit while preserving the return value.
// The return registers are spilled at cfg->param_area off the frame register
// according to save_mode, FUNC is called with cfg->method in R0 (and the
// return value in the following registers when ENABLE_ARGUMENTS is set), and
// the return registers are reloaded afterwards.
// NOTE: this listing omits short lines (case labels, braces, break), so the
// save_mode labels of the two switches below are not visible.
2991 mono_arch_instrument_epilog_full (MonoCompile *cfg, void *func, void *p, gboolean enable_arguments, gboolean preserve_argument_registers)
2994 int save_mode = SAVE_NONE;
2996 MonoMethod *method = cfg->method;
2997 MonoType *ret_type = mini_get_underlying_type (mono_method_signature (method)->ret);
2998 int rtype = ret_type->type;
2999 int save_offset = cfg->param_area;
// Grow the native code buffer when fewer than 16 instructions worth of space
// is left, then rebase code onto the reallocated buffer.
3003 offset = code - cfg->native_code;
3004 /* we need about 16 instructions */
3005 if (offset > (cfg->code_size - 16 * 4)) {
3006 cfg->code_size *= 2;
3007 cfg->native_code = g_realloc (cfg->native_code, cfg->code_size);
3008 code = cfg->native_code + offset;
3011 case MONO_TYPE_VOID:
3012 /* special case string .ctor icall */
// strcmp () returns 0 on a match, so the test has to be negated to select the
// method that IS named .ctor on the string class. The previous form selected
// every void method of the string class except .ctor.
3013 if (!strcmp (".ctor", method->name) && method->klass == mono_defaults.string_class)
3014 save_mode = SAVE_ONE;
3016 save_mode = SAVE_NONE;
3020 save_mode = SAVE_TWO;
3024 save_mode = SAVE_ONE_FP;
3026 save_mode = SAVE_ONE;
3030 save_mode = SAVE_TWO_FP;
3032 save_mode = SAVE_TWO;
3034 case MONO_TYPE_GENERICINST:
3035 if (!mono_type_generic_inst_is_valuetype (ret_type)) {
3036 save_mode = SAVE_ONE;
3040 case MONO_TYPE_VALUETYPE:
3041 save_mode = SAVE_STRUCT;
3044 save_mode = SAVE_ONE;
// Spill the return registers and, when requested, shift the return value up
// by one register so that R0 is free for the method argument.
3048 switch (save_mode) {
3050 ARM_STR_IMM (code, ARMREG_R0, cfg->frame_reg, save_offset);
3051 ARM_STR_IMM (code, ARMREG_R1, cfg->frame_reg, save_offset + 4);
3052 if (enable_arguments) {
3053 ARM_MOV_REG_REG (code, ARMREG_R2, ARMREG_R1);
3054 ARM_MOV_REG_REG (code, ARMREG_R1, ARMREG_R0);
3058 ARM_STR_IMM (code, ARMREG_R0, cfg->frame_reg, save_offset);
3059 if (enable_arguments) {
3060 ARM_MOV_REG_REG (code, ARMREG_R1, ARMREG_R0);
3064 ARM_FSTS (code, ARM_VFP_F0, cfg->frame_reg, save_offset);
3065 if (enable_arguments) {
3066 ARM_FMRS (code, ARMREG_R1, ARM_VFP_F0);
3070 ARM_FSTD (code, ARM_VFP_D0, cfg->frame_reg, save_offset);
3071 if (enable_arguments) {
// NOTE(review): the intent here looks like copying D0 into R1 and R2 for the
// call; confirm that ARM_FMDRR moves in that direction and not from the core
// registers into D0.
3072 ARM_FMDRR (code, ARMREG_R1, ARMREG_R2, ARM_VFP_D0);
3076 if (enable_arguments) {
3077 /* FIXME: get the actual address */
3078 ARM_MOV_REG_REG (code, ARMREG_R1, ARMREG_R0);
// Call FUNC through IP with the method in R0.
3086 code = mono_arm_emit_load_imm (code, ARMREG_R0, (guint32)cfg->method);
3087 code = mono_arm_emit_load_imm (code, ARMREG_IP, (guint32)func);
3088 code = emit_call_reg (code, ARMREG_IP);
// Reload whatever was spilled above.
3090 switch (save_mode) {
3092 ARM_LDR_IMM (code, ARMREG_R0, cfg->frame_reg, save_offset);
3093 ARM_LDR_IMM (code, ARMREG_R1, cfg->frame_reg, save_offset + 4);
3096 ARM_LDR_IMM (code, ARMREG_R0, cfg->frame_reg, save_offset);
3099 ARM_FLDS (code, ARM_VFP_F0, cfg->frame_reg, save_offset);
3102 ARM_FLDD (code, ARM_VFP_D0, cfg->frame_reg, save_offset);
3113 * The immediate field for cond branches is big enough for all reasonable methods
3115 #define EMIT_COND_BRANCH_FLAGS(ins,condcode) \
3116 if (0 && ins->inst_true_bb->native_offset) { \
3117 ARM_B_COND (code, (condcode), (code - cfg->native_code + ins->inst_true_bb->native_offset) & 0xffffff); \
3119 mono_add_patch_info (cfg, code - cfg->native_code, MONO_PATCH_INFO_BB, ins->inst_true_bb); \
3120 ARM_B_COND (code, (condcode), 0); \
3123 #define EMIT_COND_BRANCH(ins,cond) EMIT_COND_BRANCH_FLAGS(ins, branch_cc_table [(cond)])
3125 /* emit an exception if the condition fails
3127 * We assign the extra code used to throw the implicit exceptions
3128 * to cfg->bb_exit as far as the big branch handling is concerned
3130 #define EMIT_COND_SYSTEM_EXCEPTION_FLAGS(condcode,exc_name) \
3132 mono_add_patch_info (cfg, code - cfg->native_code, \
3133 MONO_PATCH_INFO_EXC, exc_name); \
3134 ARM_BL_COND (code, (condcode), 0); \
3137 #define EMIT_COND_SYSTEM_EXCEPTION(cond,exc_name) EMIT_COND_SYSTEM_EXCEPTION_FLAGS(branch_cc_table [(cond)], (exc_name))
3140 mono_arch_peephole_pass_1 (MonoCompile *cfg, MonoBasicBlock *bb)
// mono_arch_peephole_pass_2:
//
//   Local peephole optimizations over the instructions of BB. Each rule looks
// at the current instruction and the previous one (skipping IL sequence
// points) and either deletes the current instruction or rewrites it into a
// cheaper register operation.
// NOTE: this listing omits short lines (braces, break, continue, some case
// labels and comment delimiters).
3145 mono_arch_peephole_pass_2 (MonoCompile *cfg, MonoBasicBlock *bb)
3149 MONO_BB_FOR_EACH_INS_SAFE (bb, n, ins) {
3150 MonoInst *last_ins = mono_inst_prev (ins, FILTER_IL_SEQ_POINT);
3152 switch (ins->opcode) {
3155 /* Already done by an arch-independent pass */
3157 case OP_LOAD_MEMBASE:
3158 case OP_LOADI4_MEMBASE:
3160 * OP_STORE_MEMBASE_REG reg, offset(basereg)
3161 * OP_LOAD_MEMBASE offset(basereg), reg
// Store followed by a load of the same slot: drop the load when it targets
// the stored register, otherwise turn it into a move from that register.
3163 if (last_ins && (last_ins->opcode == OP_STOREI4_MEMBASE_REG
3164 || last_ins->opcode == OP_STORE_MEMBASE_REG) &&
3165 ins->inst_basereg == last_ins->inst_destbasereg &&
3166 ins->inst_offset == last_ins->inst_offset) {
3167 if (ins->dreg == last_ins->sreg1) {
3168 MONO_DELETE_INS (bb, ins);
3171 //static int c = 0; g_print ("MATCHX %s %d\n", cfg->method->name,c++);
3172 ins->opcode = OP_MOVE;
3173 ins->sreg1 = last_ins->sreg1;
3177 * Note: reg1 must be different from the basereg in the second load
3178 * OP_LOAD_MEMBASE offset(basereg), reg1
3179 * OP_LOAD_MEMBASE offset(basereg), reg2
3181 * OP_LOAD_MEMBASE offset(basereg), reg1
3182 * OP_MOVE reg1, reg2
// This if is not chained with else to the store/load rule above. The two
// rules test disjoint opcodes of last_ins (store versus load), so at most
// one of them can match for a given pair.
3184 } if (last_ins && (last_ins->opcode == OP_LOADI4_MEMBASE
3185 || last_ins->opcode == OP_LOAD_MEMBASE) &&
3186 ins->inst_basereg != last_ins->dreg &&
3187 ins->inst_basereg == last_ins->inst_basereg &&
3188 ins->inst_offset == last_ins->inst_offset) {
3190 if (ins->dreg == last_ins->dreg) {
3191 MONO_DELETE_INS (bb, ins);
3194 ins->opcode = OP_MOVE;
3195 ins->sreg1 = last_ins->dreg;
3198 //g_assert_not_reached ();
3202 * OP_STORE_MEMBASE_IMM imm, offset(basereg)
3203 * OP_LOAD_MEMBASE offset(basereg), reg
3205 * OP_STORE_MEMBASE_IMM imm, offset(basereg)
3206 * OP_ICONST reg, imm
3208 } else if (last_ins && (last_ins->opcode == OP_STOREI4_MEMBASE_IMM
3209 || last_ins->opcode == OP_STORE_MEMBASE_IMM) &&
3210 ins->inst_basereg == last_ins->inst_destbasereg &&
3211 ins->inst_offset == last_ins->inst_offset) {
3212 //static int c = 0; g_print ("MATCHX %s %d\n", cfg->method->name,c++);
3213 ins->opcode = OP_ICONST;
3214 ins->inst_c0 = last_ins->inst_imm;
// The rule above is followed by an unconditional assertion, so a match of
// the immediate-store pattern aborts instead of being silently applied.
3215 g_assert_not_reached (); // check this rule
3219 case OP_LOADU1_MEMBASE:
3220 case OP_LOADI1_MEMBASE:
// Byte store followed by a byte load of the same slot becomes a sign or zero
// extension of the stored register, matching the signedness of the load.
3221 if (last_ins && (last_ins->opcode == OP_STOREI1_MEMBASE_REG) &&
3222 ins->inst_basereg == last_ins->inst_destbasereg &&
3223 ins->inst_offset == last_ins->inst_offset) {
3224 ins->opcode = (ins->opcode == OP_LOADI1_MEMBASE) ? OP_ICONV_TO_I1 : OP_ICONV_TO_U1;
3225 ins->sreg1 = last_ins->sreg1;
3228 case OP_LOADU2_MEMBASE:
3229 case OP_LOADI2_MEMBASE:
// Same rule for 16 bit stores and loads.
3230 if (last_ins && (last_ins->opcode == OP_STOREI2_MEMBASE_REG) &&
3231 ins->inst_basereg == last_ins->inst_destbasereg &&
3232 ins->inst_offset == last_ins->inst_offset) {
3233 ins->opcode = (ins->opcode == OP_LOADI2_MEMBASE) ? OP_ICONV_TO_I2 : OP_ICONV_TO_U2;
3234 ins->sreg1 = last_ins->sreg1;
3238 ins->opcode = OP_MOVE;
// A move of a register onto itself is removed.
3242 if (ins->dreg == ins->sreg1) {
3243 MONO_DELETE_INS (bb, ins);
3247 * OP_MOVE sreg, dreg
3248 * OP_MOVE dreg, sreg
// A move that just undoes the previous move is removed.
3250 if (last_ins && last_ins->opcode == OP_MOVE &&
3251 ins->sreg1 == last_ins->dreg &&
3252 ins->dreg == last_ins->sreg1) {
3253 MONO_DELETE_INS (bb, ins);
3262 * the branch_cc_table should maintain the order of these
3276 branch_cc_table [] = {
3290 #define ADD_NEW_INS(cfg,dest,op) do { \
3291 MONO_INST_NEW ((cfg), (dest), (op)); \
3292 mono_bblock_insert_before_ins (bb, ins, (dest)); \
// map_to_reg_reg_op:
//
//   Map an opcode that takes an immediate or a base+offset operand to the
// variant that takes the value in a register. The visible cases map MEMBASE
// loads and MEMBASE_REG stores to their MEMINDEX forms, and MEMBASE_IMM
// stores to the matching MEMBASE_REG stores. Any opcode without a mapping
// ends in g_assert_not_reached ().
// NOTE: several case labels and return statements are on lines omitted from
// this listing.
3296 map_to_reg_reg_op (int op)
3305 case OP_COMPARE_IMM:
3307 case OP_ICOMPARE_IMM:
3321 case OP_LOAD_MEMBASE:
3322 return OP_LOAD_MEMINDEX;
3323 case OP_LOADI4_MEMBASE:
3324 return OP_LOADI4_MEMINDEX;
3325 case OP_LOADU4_MEMBASE:
3326 return OP_LOADU4_MEMINDEX;
3327 case OP_LOADU1_MEMBASE:
3328 return OP_LOADU1_MEMINDEX;
3329 case OP_LOADI2_MEMBASE:
3330 return OP_LOADI2_MEMINDEX;
3331 case OP_LOADU2_MEMBASE:
3332 return OP_LOADU2_MEMINDEX;
3333 case OP_LOADI1_MEMBASE:
3334 return OP_LOADI1_MEMINDEX;
3335 case OP_STOREI1_MEMBASE_REG:
3336 return OP_STOREI1_MEMINDEX;
3337 case OP_STOREI2_MEMBASE_REG:
3338 return OP_STOREI2_MEMINDEX;
3339 case OP_STOREI4_MEMBASE_REG:
3340 return OP_STOREI4_MEMINDEX;
3341 case OP_STORE_MEMBASE_REG:
3342 return OP_STORE_MEMINDEX;
3343 case OP_STORER4_MEMBASE_REG:
3344 return OP_STORER4_MEMINDEX;
3345 case OP_STORER8_MEMBASE_REG:
3346 return OP_STORER8_MEMINDEX;
// Immediate stores only lose the immediate here; the offset stays a MEMBASE
// offset and may need a further mapping by the caller.
3347 case OP_STORE_MEMBASE_IMM:
3348 return OP_STORE_MEMBASE_REG;
3349 case OP_STOREI1_MEMBASE_IMM:
3350 return OP_STOREI1_MEMBASE_REG;
3351 case OP_STOREI2_MEMBASE_IMM:
3352 return OP_STOREI2_MEMBASE_REG;
3353 case OP_STOREI4_MEMBASE_IMM:
3354 return OP_STOREI4_MEMBASE_REG;
3356 g_assert_not_reached ();
3360 * Remove from the instruction list the instructions that can't be
3361 * represented with very simple instructions with no register
// mono_arch_lowering_pass:
//
//   Rewrite the instructions of BB whose immediate or offset operand cannot
// be encoded directly. The general pattern is: insert an OP_ICONST before
// the instruction (ADD_NEW_INS), point the instruction at the new vreg and
// switch it to the register form of the opcode.
// NOTE: this listing omits short lines (braces, break, many case labels and
// the loop_start label), so the case grouping is only partly visible.
3365 mono_arch_lowering_pass (MonoCompile *cfg, MonoBasicBlock *bb)
3367 MonoInst *ins, *temp, *last_ins = NULL;
3368 int rot_amount, imm8, low_imm;
3370 MONO_BB_FOR_EACH_INS (bb, ins) {
3372 switch (ins->opcode) {
3376 case OP_COMPARE_IMM:
3377 case OP_ICOMPARE_IMM:
// ALU immediates that are not a rotated 8 bit value are loaded into a vreg
// and the opcode is replaced by its register form from mono_op_imm_to_op ().
3391 if ((imm8 = mono_arm_is_rotated_imm8 (ins->inst_imm, &rot_amount)) < 0) {
3392 int opcode2 = mono_op_imm_to_op (ins->opcode);
3393 ADD_NEW_INS (cfg, temp, OP_ICONST);
3394 temp->inst_c0 = ins->inst_imm;
3395 temp->dreg = mono_alloc_ireg (cfg);
3396 ins->sreg2 = temp->dreg;
3398 g_error ("mono_op_imm_to_op failed for %s\n", mono_inst_name (ins->opcode));
3399 ins->opcode = opcode2;
3401 if (ins->opcode == OP_SBB || ins->opcode == OP_ISBB || ins->opcode == OP_SUBCC)
// Multiplication by a constant: 1 becomes a move, 0 a constant, a power of
// two a shift, anything else a register multiply with the constant in a vreg.
3407 if (ins->inst_imm == 1) {
3408 ins->opcode = OP_MOVE;
3411 if (ins->inst_imm == 0) {
3412 ins->opcode = OP_ICONST;
3416 imm8 = mono_is_power_of_two (ins->inst_imm);
3418 ins->opcode = OP_SHL_IMM;
3419 ins->inst_imm = imm8;
3422 ADD_NEW_INS (cfg, temp, OP_ICONST);
3423 temp->inst_c0 = ins->inst_imm;
3424 temp->dreg = mono_alloc_ireg (cfg);
3425 ins->sreg2 = temp->dreg;
3426 ins->opcode = OP_IMUL;
// The carry based exception check that follows is inverted, see the comment
// on the next line.
3432 if (ins->next && (ins->next->opcode == OP_COND_EXC_C || ins->next->opcode == OP_COND_EXC_IC))
3433 /* ARM sets the C flag to 1 if there was _no_ overflow */
3434 ins->next->opcode = OP_COND_EXC_NC;
3437 case OP_IDIV_UN_IMM:
3439 case OP_IREM_UN_IMM: {
3440 int opcode2 = mono_op_imm_to_op (ins->opcode);
3441 ADD_NEW_INS (cfg, temp, OP_ICONST);
3442 temp->inst_c0 = ins->inst_imm;
3443 temp->dreg = mono_alloc_ireg (cfg);
3444 ins->sreg2 = temp->dreg;
3446 g_error ("mono_op_imm_to_op failed for %s\n", mono_inst_name (ins->opcode));
3447 ins->opcode = opcode2;
3450 case OP_LOCALLOC_IMM:
3451 ADD_NEW_INS (cfg, temp, OP_ICONST);
3452 temp->inst_c0 = ins->inst_imm;
3453 temp->dreg = mono_alloc_ireg (cfg);
3454 ins->sreg1 = temp->dreg;
3455 ins->opcode = OP_LOCALLOC;
3457 case OP_LOAD_MEMBASE:
3458 case OP_LOADI4_MEMBASE:
3459 case OP_LOADU4_MEMBASE:
3460 case OP_LOADU1_MEMBASE:
3461 /* we can do two things: load the immed in a register
3462 * and use an indexed load, or see if the immed can be
3463 * represented as an ad_imm + a load with a smaller offset
3464 * that fits. We just do the first for now, optimize later.
3466 if (arm_is_imm12 (ins->inst_offset))
3468 ADD_NEW_INS (cfg, temp, OP_ICONST);
3469 temp->inst_c0 = ins->inst_offset;
3470 temp->dreg = mono_alloc_ireg (cfg);
3471 ins->sreg2 = temp->dreg;
3472 ins->opcode = map_to_reg_reg_op (ins->opcode);
3474 case OP_LOADI2_MEMBASE:
3475 case OP_LOADU2_MEMBASE:
3476 case OP_LOADI1_MEMBASE:
// These loads are checked against the narrower arm_is_imm8 () offset range.
3477 if (arm_is_imm8 (ins->inst_offset))
3479 ADD_NEW_INS (cfg, temp, OP_ICONST);
3480 temp->inst_c0 = ins->inst_offset;
3481 temp->dreg = mono_alloc_ireg (cfg);
3482 ins->sreg2 = temp->dreg;
3483 ins->opcode = map_to_reg_reg_op (ins->opcode);
3485 case OP_LOADR4_MEMBASE:
3486 case OP_LOADR8_MEMBASE:
3487 if (arm_is_fpimm8 (ins->inst_offset))
// Split the offset: the high part is added to the base with OP_ADD_IMM and
// the low 9 bits stay as the load offset.
// NOTE(review): unlike the R4/R8 store case further down, this path does not
// check arm_is_fpimm8 (low_imm) before using low_imm as the offset. Confirm
// whether the check is needed here as well.
3489 low_imm = ins->inst_offset & 0x1ff;
3490 if ((imm8 = mono_arm_is_rotated_imm8 (ins->inst_offset & ~0x1ff, &rot_amount)) >= 0) {
3491 ADD_NEW_INS (cfg, temp, OP_ADD_IMM);
3492 temp->inst_imm = ins->inst_offset & ~0x1ff;
3493 temp->sreg1 = ins->inst_basereg;
3494 temp->dreg = mono_alloc_ireg (cfg);
3495 ins->inst_basereg = temp->dreg;
3496 ins->inst_offset = low_imm;
// Fallback: compute base + offset into a fresh vreg and load at offset 0.
3500 ADD_NEW_INS (cfg, temp, OP_ICONST);
3501 temp->inst_c0 = ins->inst_offset;
3502 temp->dreg = mono_alloc_ireg (cfg);
3504 ADD_NEW_INS (cfg, add_ins, OP_IADD);
3505 add_ins->sreg1 = ins->inst_basereg;
3506 add_ins->sreg2 = temp->dreg;
3507 add_ins->dreg = mono_alloc_ireg (cfg);
3509 ins->inst_basereg = add_ins->dreg;
3510 ins->inst_offset = 0;
3513 case OP_STORE_MEMBASE_REG:
3514 case OP_STOREI4_MEMBASE_REG:
3515 case OP_STOREI1_MEMBASE_REG:
3516 if (arm_is_imm12 (ins->inst_offset))
3518 ADD_NEW_INS (cfg, temp, OP_ICONST);
3519 temp->inst_c0 = ins->inst_offset;
3520 temp->dreg = mono_alloc_ireg (cfg);
3521 ins->sreg2 = temp->dreg;
3522 ins->opcode = map_to_reg_reg_op (ins->opcode);
3524 case OP_STOREI2_MEMBASE_REG:
3525 if (arm_is_imm8 (ins->inst_offset))
3527 ADD_NEW_INS (cfg, temp, OP_ICONST);
3528 temp->inst_c0 = ins->inst_offset;
3529 temp->dreg = mono_alloc_ireg (cfg);
3530 ins->sreg2 = temp->dreg;
3531 ins->opcode = map_to_reg_reg_op (ins->opcode);
3533 case OP_STORER4_MEMBASE_REG:
3534 case OP_STORER8_MEMBASE_REG:
3535 if (arm_is_fpimm8 (ins->inst_offset))
3537 low_imm = ins->inst_offset & 0x1ff;
3538 if ((imm8 = mono_arm_is_rotated_imm8 (ins->inst_offset & ~ 0x1ff, &rot_amount)) >= 0 && arm_is_fpimm8 (low_imm)) {
3539 ADD_NEW_INS (cfg, temp, OP_ADD_IMM);
3540 temp->inst_imm = ins->inst_offset & ~0x1ff;
3541 temp->sreg1 = ins->inst_destbasereg;
3542 temp->dreg = mono_alloc_ireg (cfg);
3543 ins->inst_destbasereg = temp->dreg;
3544 ins->inst_offset = low_imm;
3548 ADD_NEW_INS (cfg, temp, OP_ICONST);
3549 temp->inst_c0 = ins->inst_offset;
3550 temp->dreg = mono_alloc_ireg (cfg);
3552 ADD_NEW_INS (cfg, add_ins, OP_IADD);
3553 add_ins->sreg1 = ins->inst_destbasereg;
3554 add_ins->sreg2 = temp->dreg;
3555 add_ins->dreg = mono_alloc_ireg (cfg);
3557 ins->inst_destbasereg = add_ins->dreg;
3558 ins->inst_offset = 0;
3561 case OP_STORE_MEMBASE_IMM:
3562 case OP_STOREI1_MEMBASE_IMM:
3563 case OP_STOREI2_MEMBASE_IMM:
3564 case OP_STOREI4_MEMBASE_IMM:
// Immediate stores: load the immediate into a vreg, switch to the register
// store, then run the rewritten instruction through the switch again.
3565 ADD_NEW_INS (cfg, temp, OP_ICONST);
3566 temp->inst_c0 = ins->inst_imm;
3567 temp->dreg = mono_alloc_ireg (cfg);
3568 ins->sreg1 = temp->dreg;
3569 ins->opcode = map_to_reg_reg_op (ins->opcode);
3571 goto loop_start; /* make it handle the possibly big ins->inst_offset */
3574 gboolean swap = FALSE;
3578 /* Optimized away */
3583 /* Some fp compares require swapped operands */
3584 switch (ins->next->opcode) {
3586 ins->next->opcode = OP_FBLT;
3590 ins->next->opcode = OP_FBLT_UN;
3594 ins->next->opcode = OP_FBGE;
3598 ins->next->opcode = OP_FBGE_UN;
3606 ins->sreg1 = ins->sreg2;
// Publish the new last instruction and the vreg high-water mark on the block.
3615 bb->last_ins = last_ins;
3616 bb->max_vreg = cfg->next_vreg;
// mono_arch_decompose_long_opts:
//
//   Arch specific decomposition of 64 bit opcodes. The only visible case is
// OP_LNEG, emitted as OP_ARM_RSBS_IMM with immediate 0 on the low word
// followed by OP_ARM_RSC_IMM with immediate 0 on the high word.
// NOTE: the definition of ins is on a line omitted from this listing.
3620 mono_arch_decompose_long_opts (MonoCompile *cfg, MonoInst *long_ins)
3624 if (long_ins->opcode == OP_LNEG) {
3626 MONO_EMIT_NEW_BIALU_IMM (cfg, OP_ARM_RSBS_IMM, MONO_LVREG_LS (ins->dreg), MONO_LVREG_LS (ins->sreg1), 0);
3627 MONO_EMIT_NEW_BIALU_IMM (cfg, OP_ARM_RSC_IMM, MONO_LVREG_MS (ins->dreg), MONO_LVREG_MS (ins->sreg1), 0);
// emit_float_to_int:
//
//   Emit code converting the floating point register SREG to an integer in
// DREG, then narrowing the result to SIZE bytes. The conversion goes through
// the VFP scratch register vfp_scratch1, which is saved before and restored
// after use.
// NOTE: the conditions selecting between the paths below (presumably on
// is_signed and size) are on lines omitted from this listing.
3633 emit_float_to_int (MonoCompile *cfg, guchar *code, int dreg, int sreg, int size, gboolean is_signed)
3635 /* sreg is a float, dreg is an integer reg */
3637 code = mono_arm_emit_vfp_scratch_save (cfg, code, vfp_scratch1);
3639 ARM_TOSIZD (code, vfp_scratch1, sreg);
3641 ARM_TOUIZD (code, vfp_scratch1, sreg);
3642 ARM_FMRS (code, dreg, vfp_scratch1);
3643 code = mono_arm_emit_vfp_scratch_restore (cfg, code, vfp_scratch1);
// Narrowing with AND or a SHL / SHR pair.
3647 ARM_AND_REG_IMM8 (code, dreg, dreg, 0xff);
3648 else if (size == 2) {
3649 ARM_SHL_IMM (code, dreg, dreg, 16);
3650 ARM_SHR_IMM (code, dreg, dreg, 16);
// Narrowing with a SHL / SAR pair.
3654 ARM_SHL_IMM (code, dreg, dreg, 24);
3655 ARM_SAR_IMM (code, dreg, dreg, 24);
3656 } else if (size == 2) {
3657 ARM_SHL_IMM (code, dreg, dreg, 16);
3658 ARM_SAR_IMM (code, dreg, dreg, 16);
// emit_r4_to_int:
//
//   Same structure as emit_float_to_int () but using the ARM_TOSIZS and
// ARM_TOUIZS conversion macros instead of the D suffixed ones. The result is
// moved from vfp_scratch1 to DREG and narrowed to SIZE bytes.
// NOTE: the conditions selecting between the paths below are on lines
// omitted from this listing.
3665 emit_r4_to_int (MonoCompile *cfg, guchar *code, int dreg, int sreg, int size, gboolean is_signed)
3667 /* sreg is a float, dreg is an integer reg */
3669 code = mono_arm_emit_vfp_scratch_save (cfg, code, vfp_scratch1);
3671 ARM_TOSIZS (code, vfp_scratch1, sreg);
3673 ARM_TOUIZS (code, vfp_scratch1, sreg);
3674 ARM_FMRS (code, dreg, vfp_scratch1);
3675 code = mono_arm_emit_vfp_scratch_restore (cfg, code, vfp_scratch1);
// Narrowing with AND or a SHL / SHR pair.
3679 ARM_AND_REG_IMM8 (code, dreg, dreg, 0xff);
3680 else if (size == 2) {
3681 ARM_SHL_IMM (code, dreg, dreg, 16);
3682 ARM_SHR_IMM (code, dreg, dreg, 16);
// Narrowing with a SHL / SAR pair.
3686 ARM_SHL_IMM (code, dreg, dreg, 24);
3687 ARM_SAR_IMM (code, dreg, dreg, 24);
3688 } else if (size == 2) {
3689 ARM_SHL_IMM (code, dreg, dreg, 16);
3690 ARM_SAR_IMM (code, dreg, dreg, 16);
3696 #endif /* #ifndef DISABLE_JIT */
// is_call_imm: true when DIFF, cast to gint, lies in [-2^25, 2^25 - 1]
// (-33554432 .. 33554431). The argument is evaluated twice.
3698 #define is_call_imm(diff) ((gint)(diff) >= -33554432 && (gint)(diff) <= 33554431)
// emit_thunk:
//
//   Write a thunk at CODE that jumps to TARGET: a load of IP relative to PC,
// a jump through IP (BX when thumb_supported, a move into PC otherwise) and
// the target address stored as a 32 bit word. The instruction cache is
// flushed for the emitted range, where p is presumably the start of the
// thunk saved on a line omitted from this listing.
3701 emit_thunk (guint8 *code, gconstpointer target)
3705 ARM_LDR_IMM (code, ARMREG_IP, ARMREG_PC, 0);
3706 if (thumb_supported)
3707 ARM_BX (code, ARMREG_IP);
3709 ARM_MOV_REG_REG (code, ARMREG_PC, ARMREG_IP);
3710 *(guint32*)code = (guint32)target;
3712 mono_arch_flush_icache (p, code - p);
// handle_thunk:
//
//   Redirect the branch at CODE to TARGET through a thunk. Two paths are
// visible:
//   - one that hands out thunks sequentially from the area recorded in
//     cfg->arch.thunks, advancing by THUNK_SIZE per thunk;
//   - one that looks up the jit info containing CODE, searches its thunk
//     area under the arch lock, then emits the thunk and patches the branch.
// Running out of thunk space is fatal on both paths.
// NOTE: the condition selecting between the two paths and several braces
// are on lines omitted from this listing.
3716 handle_thunk (MonoCompile *cfg, MonoDomain *domain, guchar *code, const guchar *target)
3718 MonoJitInfo *ji = NULL;
3719 MonoThunkJitInfo *info;
3722 guint8 *orig_target;
3723 guint8 *target_thunk;
3726 domain = mono_domain_get ();
3730 * This can be called multiple times during JITting,
3731 * save the current position in cfg->arch to avoid
3732 * doing a O(n^2) search.
// Lazily initialise the cursor into the thunk area reserved for this method.
3734 if (!cfg->arch.thunks) {
3735 cfg->arch.thunks = cfg->thunks;
3736 cfg->arch.thunks_size = cfg->thunk_area;
3738 thunks = cfg->arch.thunks;
3739 thunks_size = cfg->arch.thunks_size;
3741 g_print ("thunk failed %p->%p, thunk space=%d method %s", code, target, thunks_size, mono_method_full_name (cfg->method, TRUE));
3742 g_assert_not_reached ();
// The slot at the cursor must still be unused (first word zero).
3745 g_assert (*(guint32*)thunks == 0);
3746 emit_thunk (thunks, target);
3747 arm_patch (code, thunks);
3749 cfg->arch.thunks += THUNK_SIZE;
3750 cfg->arch.thunks_size -= THUNK_SIZE;
// Path that locates the thunk area through the jit info of the call site.
3752 ji = mini_jit_info_table_find (domain, (char*)code, NULL);
3754 info = mono_jit_info_get_thunk_info (ji);
3757 thunks = (guint8*)ji->code_start + info->thunks_offset;
3758 thunks_size = info->thunks_size;
3760 orig_target = mono_arch_get_call_target (code + 4);
3762 mono_mini_arch_lock ();
3764 target_thunk = NULL;
3765 if (orig_target >= thunks && orig_target < thunks + thunks_size) {
3766 /* The call already points to a thunk, because of trampolines etc. */
3767 target_thunk = orig_target;
// Otherwise scan the thunk area for a slot whose first word is zero or whose
// third word already holds TARGET.
3769 for (p = thunks; p < thunks + thunks_size; p += THUNK_SIZE) {
3770 if (((guint32*)p) [0] == 0) {
3774 } else if (((guint32*)p) [2] == (guint32)target) {
3775 /* Thunk already points to target */
3782 //g_print ("THUNK: %p %p %p\n", code, target, target_thunk);
// The lock is released before reporting the failure; cfg may be NULL here,
// in which case the method name is taken from the jit info.
3784 if (!target_thunk) {
3785 mono_mini_arch_unlock ();
3786 g_print ("thunk failed %p->%p, thunk space=%d method %s", code, target, thunks_size, cfg ? mono_method_full_name (cfg->method, TRUE) : mono_method_full_name (jinfo_get_method (ji), TRUE));
3787 g_assert_not_reached ();
3790 emit_thunk (target_thunk, target);
3791 arm_patch (code, target_thunk);
3792 mono_arch_flush_icache (code, 4);
3794 mono_mini_arch_unlock ();
// arm_patch_general:
//
//   Patch the instruction sequence at CODE so that it transfers control to
// TARGET. The shape of the sequence is recognised from the instruction word
// at CODE:
//   - bits 27..25 equal to 101b: a direct branch. The displacement is
//     rewritten in place when it fits the checked range, otherwise
//     handle_thunk () is used;
//   - a BX or BLX through a register: the address constant embedded in the
//     surrounding sequence is overwritten, after asserting that the
//     neighbouring words match the expected instructions;
//   - otherwise the sequences built into ccode below are compared and the
//     embedded constant is overwritten.
// Unrecognised sequences end in g_assert_not_reached ().
// NOTE: this listing omits short lines (braces, return, the ccode
// declarations, comment delimiters).
3799 arm_patch_general (MonoCompile *cfg, MonoDomain *domain, guchar *code, const guchar *target)
3801 guint32 *code32 = (void*)code;
3802 guint32 ins = *code32;
3803 guint32 prim = (ins >> 25) & 7;
3804 guint32 tval = GPOINTER_TO_UINT (target);
3806 //g_print ("patching 0x%08x (0x%08x) to point to 0x%08x\n", code, ins, target);
3807 if (prim == 5) { /* 101b */
3808 /* the diff starts 8 bytes from the branch opcode */
3809 gint diff = target - code - 8;
3811 gint tmask = 0xffffffff;
// A target with bit 0 set is a thumb entry point: the displacement is
// computed without that bit and the instruction must be a BL.
3812 if (tval & 1) { /* entering thumb mode */
3813 diff = target - 1 - code - 8;
3814 g_assert (thumb_supported);
3815 tbits = 0xf << 28; /* bl->blx bit pattern */
3816 g_assert ((ins & (1 << 24))); /* it must be a bl, not b instruction */
3817 /* this low bit of the displacement is moved to bit 24 in the instruction encoding */
3821 tmask = ~(1 << 24); /* clear the link bit */
3822 /*g_print ("blx to thumb: target: %p, code: %p, diff: %d, mask: %x\n", target, code, diff, tmask);*/
// Displacement range checks: up to 2^25 - 1 forwards, down to -2^25 backwards.
3827 if (diff <= 33554431) {
3829 ins = (ins & 0xff000000) | diff;
3831 *code32 = ins | tbits;
3835 /* diff between 0 and -33554432 */
3836 if (diff >= -33554432) {
3838 ins = (ins & 0xff000000) | (diff & ~0xff000000);
3840 *code32 = ins | tbits;
// Out of range for a direct branch: go through a thunk.
3845 handle_thunk (cfg, domain, code, target);
3850 * The alternative call sequences looks like this:
3852 * ldr ip, [pc] // loads the address constant
3853 * b 1f // jumps around the constant
3854 * address constant embedded in the code
3859 * There are two cases for patching:
3860 * a) at the end of method emission: in this case code points to the start
3861 * of the call sequence
3862 * b) during runtime patching of the call site: in this case code points
3863 * to the mov pc, ip instruction
3865 * We have to handle also the thunk jump code sequence:
3869 * address constant // execution never reaches here
3871 if ((ins & 0x0ffffff0) == 0x12fff10) {
3872 /* Branch and exchange: the address is constructed in a reg
3873 * We can patch BX when the code sequence is the following:
3874 * ldr ip, [pc, #0] ; 0x8
// The expected sequence is assembled into ccode so that it can be compared
// word by word with the code around the patch site.
3881 guint8 *emit = (guint8*)ccode;
3882 ARM_LDR_IMM (emit, ARMREG_IP, ARMREG_PC, 0);
3884 ARM_MOV_REG_REG (emit, ARMREG_LR, ARMREG_PC);
3885 ARM_BX (emit, ARMREG_IP);
3887 /*patching from magic trampoline*/
3888 if (ins == ccode [3]) {
3889 g_assert (code32 [-4] == ccode [0]);
3890 g_assert (code32 [-3] == ccode [1]);
3891 g_assert (code32 [-1] == ccode [2]);
3892 code32 [-2] = (guint32)target;
3895 /*patching from JIT*/
3896 if (ins == ccode [0]) {
3897 g_assert (code32 [1] == ccode [1]);
3898 g_assert (code32 [3] == ccode [2]);
3899 g_assert (code32 [4] == ccode [3]);
3900 code32 [2] = (guint32)target;
3903 g_assert_not_reached ();
3904 } else if ((ins & 0x0ffffff0) == 0x12fff30) {
3912 guint8 *emit = (guint8*)ccode;
3913 ARM_LDR_IMM (emit, ARMREG_IP, ARMREG_PC, 0);
3915 ARM_BLX_REG (emit, ARMREG_IP);
3917 g_assert (code32 [-3] == ccode [0]);
3918 g_assert (code32 [-2] == ccode [1]);
3919 g_assert (code32 [0] == ccode [2]);
3921 code32 [-1] = (guint32)target;
3924 guint32 *tmp = ccode;
3925 guint8 *emit = (guint8*)tmp;
3926 ARM_LDR_IMM (emit, ARMREG_IP, ARMREG_PC, 0);
3927 ARM_MOV_REG_REG (emit, ARMREG_LR, ARMREG_PC);
3928 ARM_MOV_REG_REG (emit, ARMREG_PC, ARMREG_IP);
3929 ARM_BX (emit, ARMREG_IP);
3930 if (ins == ccode [2]) {
3931 g_assert_not_reached (); // should be -2 ...
3932 code32 [-1] = (guint32)target;
3935 if (ins == ccode [0]) {
3936 /* handles both thunk jump code and the far call sequence */
3937 code32 [2] = (guint32)target;
3940 g_assert_not_reached ();
3942 // g_print ("patched with 0x%08x\n", ins);
// arm_patch: convenience wrapper around arm_patch_general () that passes
// NULL for both the compile context and the domain.
3946 arm_patch (guchar *code, const guchar *target)
3948 arm_patch_general (NULL, NULL, code, target);
3952 * Return the >= 0 uimm8 value if val can be represented with a byte + rotation
3953 * (with the rotation amount in *rot_amount). rot_amount is already adjusted
3954 * to be used with the emit macros.
3955 * Return -1 otherwise.
// mono_arm_is_rotated_imm8:
//
//   Try every even rotation of VAL (0, 2, ..., 30). On a match *ROT_AMOUNT
// receives 0 for no rotation and 32 - i otherwise.
// NOTE: the test on res and the return statements are on lines omitted from
// this listing.
3958 mono_arm_is_rotated_imm8 (guint32 val, gint *rot_amount)
3961 for (i = 0; i < 31; i+= 2) {
// A rotation by 0 is VAL itself. It is special-cased because the general
// expression would shift a 32 bit value left by 32, which is undefined in C.
3962 res = i ? ((val << (32 - i)) | (val >> i)) : val;
3965 *rot_amount = i? 32 - i: 0;
3972 * Emits in code a sequence of instructions that load the value 'val'
3973 * into the dreg register. Uses at most 4 instructions.
// mono_arm_emit_load_imm:
//
//   Emit instructions at CODE that load the 32 bit constant VAL into DREG.
// Visible strategies, in source order:
//   - a MOVW / MOVT pair when the single_imm_size debug option is set and
//     v7_supported holds;
//   - a single MOV when VAL is a rotated 8 bit immediate, or a single MVN
//     when the complement of VAL is one;
//   - a second MOVW / MOVT sequence;
//   - a MOV of the lowest non-zero byte followed by an ADD for each remaining
//     non-zero byte.
// NOTE: this listing omits short lines, including the conditions guarding
// the literal load at the top and the second MOVW / MOVT sequence, and the
// return statement.
3976 mono_arm_emit_load_imm (guint8 *code, int dreg, guint32 val)
3978 int imm8, rot_amount;
3980 ARM_LDR_IMM (code, dreg, ARMREG_PC, 0);
3981 /* skip the constant pool */
3987 if (mini_get_debug_options()->single_imm_size && v7_supported) {
3988 ARM_MOVW_REG_IMM (code, dreg, val & 0xffff);
3989 ARM_MOVT_REG_IMM (code, dreg, (val >> 16) & 0xffff);
3993 if ((imm8 = mono_arm_is_rotated_imm8 (val, &rot_amount)) >= 0) {
3994 ARM_MOV_REG_IMM (code, dreg, imm8, rot_amount);
3995 } else if ((imm8 = mono_arm_is_rotated_imm8 (~val, &rot_amount)) >= 0) {
3996 ARM_MVN_REG_IMM (code, dreg, imm8, rot_amount);
3999 ARM_MOVW_REG_IMM (code, dreg, val & 0xffff);
4001 ARM_MOVT_REG_IMM (code, dreg, (val >> 16) & 0xffff);
// Byte by byte construction, starting from the lowest non-zero byte.
4005 ARM_MOV_REG_IMM8 (code, dreg, (val & 0xFF));
4007 ARM_ADD_REG_IMM (code, dreg, dreg, (val & 0xFF00) >> 8, 24);
4009 if (val & 0xFF0000) {
4010 ARM_ADD_REG_IMM (code, dreg, dreg, (val & 0xFF0000) >> 16, 16);
4012 if (val & 0xFF000000) {
4013 ARM_ADD_REG_IMM (code, dreg, dreg, (val & 0xFF000000) >> 24, 8);
4015 } else if (val & 0xFF00) {
4016 ARM_MOV_REG_IMM (code, dreg, (val & 0xFF00) >> 8, 24);
4017 if (val & 0xFF0000) {
4018 ARM_ADD_REG_IMM (code, dreg, dreg, (val & 0xFF0000) >> 16, 16);
4020 if (val & 0xFF000000) {
4021 ARM_ADD_REG_IMM (code, dreg, dreg, (val & 0xFF000000) >> 24, 8);
4023 } else if (val & 0xFF0000) {
4024 ARM_MOV_REG_IMM (code, dreg, (val & 0xFF0000) >> 16, 16);
4025 if (val & 0xFF000000) {
4026 ARM_ADD_REG_IMM (code, dreg, dreg, (val & 0xFF000000) >> 24, 8);
4029 //g_assert_not_reached ();
// mono_arm_thumb_supported: accessor returning the file level
// thumb_supported flag.
4035 mono_arm_thumb_supported (void)
4037 return thumb_supported;
// mono_arm_eabi_supported: accessor returning the file level
// eabi_supported flag.
4041 mono_arm_eabi_supported (void)
4043 return eabi_supported;
4047 mono_arm_i8_align (void)
/*
 * emit_move_return_value:
 *
 *   Emits the code that follows the call instruction INS and moves the value
 * returned by the callee to its final place. The visible code handles two
 * things: aggregates returned in registers (selected by cinfo->ret.storage)
 * are stored to the buffer whose address is kept in cfg->arch.vret_addr_loc,
 * and floating point results of the FCALL/RCALL opcodes are moved into
 * ins->dreg.
 *
 * Callers in this file assign the result back to their code pointer, so the
 * function presumably returns the position after the emitted instructions
 * (the return statement is not visible in this listing - TODO confirm).
 * Several guarding conditions and case labels are also not visible.
 */
4055 emit_move_return_value (MonoCompile *cfg, MonoInst *ins, guint8 *code)
/* View INS as a call instruction to reach its call_info. */
4060 call = (MonoCallInst*)ins;
4061 cinfo = call->call_info;
/* Part 1: aggregates returned in registers. */
4063 switch (cinfo->ret.storage) {
4064 case RegTypeStructByVal:
4066 MonoInst *loc = cfg->arch.vret_addr_loc;
4069 if (cinfo->ret.storage == RegTypeStructByVal && cinfo->ret.nregs == 1) {
4070 /* The JIT treats this as a normal call */
4074 /* Load the destination address */
4075 g_assert (loc && loc->opcode == OP_REGOFFSET);
/*
 * LR receives the address stored in the vret_addr_loc slot. An offset that
 * passes arm_is_imm12 is used directly; otherwise the offset is first loaded
 * into LR and used as an index register.
 */
4077 if (arm_is_imm12 (loc->inst_offset)) {
4078 ARM_LDR_IMM (code, ARMREG_LR, loc->inst_basereg, loc->inst_offset);
4080 code = mono_arm_emit_load_imm (code, ARMREG_LR, loc->inst_offset);
4081 ARM_LDR_REG_REG (code, ARMREG_LR, loc->inst_basereg, ARMREG_LR);
/*
 * RegTypeStructByVal: core register i is stored at LR + i * 4. The choice
 * between the byte, halfword and word store is made by conditions that are
 * not visible here (presumably based on rsize - TODO confirm).
 */
4084 if (cinfo->ret.storage == RegTypeStructByVal) {
4085 int rsize = cinfo->ret.struct_size;
4087 for (i = 0; i < cinfo->ret.nregs; ++i) {
4088 g_assert (rsize >= 0);
4093 ARM_STRB_IMM (code, i, ARMREG_LR, i * 4);
4096 ARM_STRH_IMM (code, i, ARMREG_LR, i * 4);
4099 ARM_STR_IMM (code, i, ARMREG_LR, i * 4);
/*
 * Other storage kinds reaching this point: store VFP registers starting at
 * cinfo->ret.reg. With esize == 4 register reg + i goes to offset i * 4 via
 * FSTS; otherwise register reg + i * 2 goes to offset i * 8 via FSTD.
 */
4105 for (i = 0; i < cinfo->ret.nregs; ++i) {
4106 if (cinfo->ret.esize == 4)
4107 ARM_FSTS (code, cinfo->ret.reg + i, ARMREG_LR, i * 4);
4109 ARM_FSTD (code, cinfo->ret.reg + (i * 2), ARMREG_LR, i * 8);
/* Part 2: floating point results, selected by the call opcode. */
4118 switch (ins->opcode) {
4121 case OP_FCALL_MEMBASE:
4123 MonoType *sig_ret = mini_get_underlying_type (((MonoCallInst*)ins)->signature->ret);
/*
 * R4 result: with IS_HARD_FLOAT it is taken from ARM_VFP_F0, otherwise from
 * ARMREG_R0 via FMSR; in both cases ARM_CVTS is applied on the way into dreg
 * (presumably a single to double conversion - confirm in arm-vfp-codegen.h).
 */
4124 if (sig_ret->type == MONO_TYPE_R4) {
4125 if (IS_HARD_FLOAT) {
4126 ARM_CVTS (code, ins->dreg, ARM_VFP_F0);
4128 ARM_FMSR (code, ins->dreg, ARMREG_R0);
4129 ARM_CVTS (code, ins->dreg, ins->dreg);
/*
 * Non R4 result: with IS_HARD_FLOAT it is copied from ARM_VFP_D0, otherwise
 * FMDRR is emitted with the ARMREG_R0/ARMREG_R1 pair and dreg.
 */
4132 if (IS_HARD_FLOAT) {
4133 ARM_CPYD (code, ins->dreg, ARM_VFP_D0);
4135 ARM_FMDRR (code, ARMREG_R0, ARMREG_R1, ins->dreg);
4142 case OP_RCALL_MEMBASE: {
4147 sig_ret = mini_get_underlying_type (((MonoCallInst*)ins)->signature->ret);
/*
 * RCALL results must be R4. Unlike the FCALL case above, plain ARM_CPYS
 * copies are emitted here and no ARM_CVTS.
 */
4148 g_assert (sig_ret->type == MONO_TYPE_R4);
4149 if (IS_HARD_FLOAT) {
4150 ARM_CPYS (code, ins->dreg, ARM_VFP_F0);
4152 ARM_FMSR (code, ins->dreg, ARMREG_R0);
4153 ARM_CPYS (code, ins->dreg, ins->dreg);
4165 mono_arch_output_basic_block (MonoCompile *cfg, MonoBasicBlock *bb)
4170 guint8 *code = cfg->native_code + cfg->code_len;
4171 MonoInst *last_ins = NULL;
4172 guint last_offset = 0;
4174 int imm8, rot_amount;
4176 /* we don't align basic blocks of loops on arm */
4178 if (cfg->verbose_level > 2)
4179 g_print ("Basic block %d starting at offset 0x%x\n", bb->block_num, bb->native_offset);
4181 cpos = bb->max_offset;
4183 if (cfg->prof_options & MONO_PROFILE_COVERAGE) {
4184 //MonoCoverageInfo *cov = mono_get_coverage_info (cfg->method);
4185 //g_assert (!mono_compile_aot);
4188 // cov->data [bb->dfn].iloffset = bb->cil_code - cfg->cil_code;
4189 /* this is not thread safe, but good enough */
4190 /* FIXME: how to handle overflows? */
4191 //x86_inc_mem (code, &cov->data [bb->dfn].count);
4194 if (mono_break_at_bb_method && mono_method_desc_full_match (mono_break_at_bb_method, cfg->method) && bb->block_num == mono_break_at_bb_bb_num) {
4195 mono_add_patch_info (cfg, code - cfg->native_code, MONO_PATCH_INFO_INTERNAL_METHOD,
4196 (gpointer)"mono_break");
4197 code = emit_call_seq (cfg, code);
4200 MONO_BB_FOR_EACH_INS (bb, ins) {
4201 offset = code - cfg->native_code;
4203 max_len = ((guint8 *)ins_get_spec (ins->opcode))[MONO_INST_LEN];
4205 if (offset > (cfg->code_size - max_len - 16)) {
4206 cfg->code_size *= 2;
4207 cfg->native_code = g_realloc (cfg->native_code, cfg->code_size);
4208 code = cfg->native_code + offset;
4210 // if (ins->cil_code)
4211 // g_print ("cil code\n");
4212 mono_debug_record_line_number (cfg, ins, offset);
4214 switch (ins->opcode) {
4215 case OP_MEMORY_BARRIER:
4217 ARM_MOV_REG_IMM8 (code, ARMREG_R0, 0);
4218 ARM_MCR (code, 15, 0, ARMREG_R0, 7, 10, 5);
4222 code = emit_tls_get (code, ins->dreg, ins->inst_offset);
4225 code = emit_tls_set (code, ins->sreg1, ins->inst_offset);
4227 case OP_ATOMIC_EXCHANGE_I4:
4228 case OP_ATOMIC_CAS_I4:
4229 case OP_ATOMIC_ADD_I4: {
4233 g_assert (v7_supported);
4236 if (ins->sreg1 != ARMREG_IP && ins->sreg2 != ARMREG_IP && ins->sreg3 != ARMREG_IP)
4238 else if (ins->sreg1 != ARMREG_R0 && ins->sreg2 != ARMREG_R0 && ins->sreg3 != ARMREG_R0)
4240 else if (ins->sreg1 != ARMREG_R1 && ins->sreg2 != ARMREG_R1 && ins->sreg3 != ARMREG_R1)
4244 g_assert (cfg->arch.atomic_tmp_offset != -1);
4245 ARM_STR_IMM (code, tmpreg, cfg->frame_reg, cfg->arch.atomic_tmp_offset);
4247 switch (ins->opcode) {
4248 case OP_ATOMIC_EXCHANGE_I4:
4250 ARM_DMB (code, ARM_DMB_SY);
4251 ARM_LDREX_REG (code, ARMREG_LR, ins->sreg1);
4252 ARM_STREX_REG (code, tmpreg, ins->sreg2, ins->sreg1);
4253 ARM_CMP_REG_IMM (code, tmpreg, 0, 0);
4255 ARM_B_COND (code, ARMCOND_NE, 0);
4256 arm_patch (buf [1], buf [0]);
4258 case OP_ATOMIC_CAS_I4:
4259 ARM_DMB (code, ARM_DMB_SY);
4261 ARM_LDREX_REG (code, ARMREG_LR, ins->sreg1);
4262 ARM_CMP_REG_REG (code, ARMREG_LR, ins->sreg3);
4264 ARM_B_COND (code, ARMCOND_NE, 0);
4265 ARM_STREX_REG (code, tmpreg, ins->sreg2, ins->sreg1);
4266 ARM_CMP_REG_IMM (code, tmpreg, 0, 0);
4268 ARM_B_COND (code, ARMCOND_NE, 0);
4269 arm_patch (buf [2], buf [0]);
4270 arm_patch (buf [1], code);
4272 case OP_ATOMIC_ADD_I4:
4274 ARM_DMB (code, ARM_DMB_SY);
4275 ARM_LDREX_REG (code, ARMREG_LR, ins->sreg1);
4276 ARM_ADD_REG_REG (code, ARMREG_LR, ARMREG_LR, ins->sreg2);
4277 ARM_STREX_REG (code, tmpreg, ARMREG_LR, ins->sreg1);
4278 ARM_CMP_REG_IMM (code, tmpreg, 0, 0);
4280 ARM_B_COND (code, ARMCOND_NE, 0);
4281 arm_patch (buf [1], buf [0]);
4284 g_assert_not_reached ();
4287 ARM_DMB (code, ARM_DMB_SY);
4288 if (tmpreg != ins->dreg)
4289 ARM_LDR_IMM (code, tmpreg, cfg->frame_reg, cfg->arch.atomic_tmp_offset);
4290 ARM_MOV_REG_REG (code, ins->dreg, ARMREG_LR);
4293 case OP_ATOMIC_LOAD_I1:
4294 case OP_ATOMIC_LOAD_U1:
4295 case OP_ATOMIC_LOAD_I2:
4296 case OP_ATOMIC_LOAD_U2:
4297 case OP_ATOMIC_LOAD_I4:
4298 case OP_ATOMIC_LOAD_U4:
4299 case OP_ATOMIC_LOAD_R4:
4300 case OP_ATOMIC_LOAD_R8: {
4301 if (ins->backend.memory_barrier_kind == MONO_MEMORY_BARRIER_SEQ)
4302 ARM_DMB (code, ARM_DMB_SY);
4304 code = mono_arm_emit_load_imm (code, ARMREG_LR, ins->inst_offset);
4306 switch (ins->opcode) {
4307 case OP_ATOMIC_LOAD_I1:
4308 ARM_LDRSB_REG_REG (code, ins->dreg, ins->inst_basereg, ARMREG_LR);
4310 case OP_ATOMIC_LOAD_U1:
4311 ARM_LDRB_REG_REG (code, ins->dreg, ins->inst_basereg, ARMREG_LR);
4313 case OP_ATOMIC_LOAD_I2:
4314 ARM_LDRSH_REG_REG (code, ins->dreg, ins->inst_basereg, ARMREG_LR);
4316 case OP_ATOMIC_LOAD_U2:
4317 ARM_LDRH_REG_REG (code, ins->dreg, ins->inst_basereg, ARMREG_LR);
4319 case OP_ATOMIC_LOAD_I4:
4320 case OP_ATOMIC_LOAD_U4:
4321 ARM_LDR_REG_REG (code, ins->dreg, ins->inst_basereg, ARMREG_LR);
4323 case OP_ATOMIC_LOAD_R4:
4325 ARM_ADD_REG_REG (code, ARMREG_LR, ins->inst_basereg, ARMREG_LR);
4326 ARM_FLDS (code, ins->dreg, ARMREG_LR, 0);
4328 code = mono_arm_emit_vfp_scratch_save (cfg, code, vfp_scratch1);
4329 ARM_ADD_REG_REG (code, ARMREG_LR, ins->inst_basereg, ARMREG_LR);
4330 ARM_FLDS (code, vfp_scratch1, ARMREG_LR, 0);
4331 ARM_CVTS (code, ins->dreg, vfp_scratch1);
4332 code = mono_arm_emit_vfp_scratch_restore (cfg, code, vfp_scratch1);
4335 case OP_ATOMIC_LOAD_R8:
4336 ARM_ADD_REG_REG (code, ARMREG_LR, ins->inst_basereg, ARMREG_LR);
4337 ARM_FLDD (code, ins->dreg, ARMREG_LR, 0);
4341 if (ins->backend.memory_barrier_kind != MONO_MEMORY_BARRIER_NONE)
4342 ARM_DMB (code, ARM_DMB_SY);
4345 case OP_ATOMIC_STORE_I1:
4346 case OP_ATOMIC_STORE_U1:
4347 case OP_ATOMIC_STORE_I2:
4348 case OP_ATOMIC_STORE_U2:
4349 case OP_ATOMIC_STORE_I4:
4350 case OP_ATOMIC_STORE_U4:
4351 case OP_ATOMIC_STORE_R4:
4352 case OP_ATOMIC_STORE_R8: {
4353 if (ins->backend.memory_barrier_kind != MONO_MEMORY_BARRIER_NONE)
4354 ARM_DMB (code, ARM_DMB_SY);
4356 code = mono_arm_emit_load_imm (code, ARMREG_LR, ins->inst_offset);
4358 switch (ins->opcode) {
4359 case OP_ATOMIC_STORE_I1:
4360 case OP_ATOMIC_STORE_U1:
4361 ARM_STRB_REG_REG (code, ins->sreg1, ins->inst_destbasereg, ARMREG_LR);
4363 case OP_ATOMIC_STORE_I2:
4364 case OP_ATOMIC_STORE_U2:
4365 ARM_STRH_REG_REG (code, ins->sreg1, ins->inst_destbasereg, ARMREG_LR);
4367 case OP_ATOMIC_STORE_I4:
4368 case OP_ATOMIC_STORE_U4:
4369 ARM_STR_REG_REG (code, ins->sreg1, ins->inst_destbasereg, ARMREG_LR);
4371 case OP_ATOMIC_STORE_R4:
4373 ARM_ADD_REG_REG (code, ARMREG_LR, ins->inst_destbasereg, ARMREG_LR);
4374 ARM_FSTS (code, ins->sreg1, ARMREG_LR, 0);
4376 code = mono_arm_emit_vfp_scratch_save (cfg, code, vfp_scratch1);
4377 ARM_ADD_REG_REG (code, ARMREG_LR, ins->inst_destbasereg, ARMREG_LR);
4378 ARM_CVTD (code, vfp_scratch1, ins->sreg1);
4379 ARM_FSTS (code, vfp_scratch1, ARMREG_LR, 0);
4380 code = mono_arm_emit_vfp_scratch_restore (cfg, code, vfp_scratch1);
4383 case OP_ATOMIC_STORE_R8:
4384 ARM_ADD_REG_REG (code, ARMREG_LR, ins->inst_destbasereg, ARMREG_LR);
4385 ARM_FSTD (code, ins->sreg1, ARMREG_LR, 0);
4389 if (ins->backend.memory_barrier_kind == MONO_MEMORY_BARRIER_SEQ)
4390 ARM_DMB (code, ARM_DMB_SY);
4394 ARM_SMULL_REG_REG (code, ins->backend.reg3, ins->dreg, ins->sreg1, ins->sreg2);
4397 ARM_UMULL_REG_REG (code, ins->backend.reg3, ins->dreg, ins->sreg1, ins->sreg2);
4399 case OP_STOREI1_MEMBASE_IMM:
4400 code = mono_arm_emit_load_imm (code, ARMREG_LR, ins->inst_imm & 0xFF);
4401 g_assert (arm_is_imm12 (ins->inst_offset));
4402 ARM_STRB_IMM (code, ARMREG_LR, ins->inst_destbasereg, ins->inst_offset);
4404 case OP_STOREI2_MEMBASE_IMM:
4405 code = mono_arm_emit_load_imm (code, ARMREG_LR, ins->inst_imm & 0xFFFF);
4406 g_assert (arm_is_imm8 (ins->inst_offset));
4407 ARM_STRH_IMM (code, ARMREG_LR, ins->inst_destbasereg, ins->inst_offset);
4409 case OP_STORE_MEMBASE_IMM:
4410 case OP_STOREI4_MEMBASE_IMM:
4411 code = mono_arm_emit_load_imm (code, ARMREG_LR, ins->inst_imm);
4412 g_assert (arm_is_imm12 (ins->inst_offset));
4413 ARM_STR_IMM (code, ARMREG_LR, ins->inst_destbasereg, ins->inst_offset);
4415 case OP_STOREI1_MEMBASE_REG:
4416 g_assert (arm_is_imm12 (ins->inst_offset));
4417 ARM_STRB_IMM (code, ins->sreg1, ins->inst_destbasereg, ins->inst_offset);
4419 case OP_STOREI2_MEMBASE_REG:
4420 g_assert (arm_is_imm8 (ins->inst_offset));
4421 ARM_STRH_IMM (code, ins->sreg1, ins->inst_destbasereg, ins->inst_offset);
4423 case OP_STORE_MEMBASE_REG:
4424 case OP_STOREI4_MEMBASE_REG:
4425 /* this case is special, since it happens for spill code after lowering has been called */
4426 if (arm_is_imm12 (ins->inst_offset)) {
4427 ARM_STR_IMM (code, ins->sreg1, ins->inst_destbasereg, ins->inst_offset);
4429 code = mono_arm_emit_load_imm (code, ARMREG_LR, ins->inst_offset);
4430 ARM_STR_REG_REG (code, ins->sreg1, ins->inst_destbasereg, ARMREG_LR);
4433 case OP_STOREI1_MEMINDEX:
4434 ARM_STRB_REG_REG (code, ins->sreg1, ins->inst_destbasereg, ins->sreg2);
4436 case OP_STOREI2_MEMINDEX:
4437 ARM_STRH_REG_REG (code, ins->sreg1, ins->inst_destbasereg, ins->sreg2);
4439 case OP_STORE_MEMINDEX:
4440 case OP_STOREI4_MEMINDEX:
4441 ARM_STR_REG_REG (code, ins->sreg1, ins->inst_destbasereg, ins->sreg2);
4444 g_assert_not_reached ();
4446 case OP_LOAD_MEMINDEX:
4447 case OP_LOADI4_MEMINDEX:
4448 case OP_LOADU4_MEMINDEX:
4449 ARM_LDR_REG_REG (code, ins->dreg, ins->inst_basereg, ins->sreg2);
4451 case OP_LOADI1_MEMINDEX:
4452 ARM_LDRSB_REG_REG (code, ins->dreg, ins->inst_basereg, ins->sreg2);
4454 case OP_LOADU1_MEMINDEX:
4455 ARM_LDRB_REG_REG (code, ins->dreg, ins->inst_basereg, ins->sreg2);
4457 case OP_LOADI2_MEMINDEX:
4458 ARM_LDRSH_REG_REG (code, ins->dreg, ins->inst_basereg, ins->sreg2);
4460 case OP_LOADU2_MEMINDEX:
4461 ARM_LDRH_REG_REG (code, ins->dreg, ins->inst_basereg, ins->sreg2);
4463 case OP_LOAD_MEMBASE:
4464 case OP_LOADI4_MEMBASE:
4465 case OP_LOADU4_MEMBASE:
4466 /* this case is special, since it happens for spill code after lowering has been called */
4467 if (arm_is_imm12 (ins->inst_offset)) {
4468 ARM_LDR_IMM (code, ins->dreg, ins->inst_basereg, ins->inst_offset);
4470 code = mono_arm_emit_load_imm (code, ARMREG_LR, ins->inst_offset);
4471 ARM_LDR_REG_REG (code, ins->dreg, ins->inst_basereg, ARMREG_LR);
4474 case OP_LOADI1_MEMBASE:
4475 g_assert (arm_is_imm8 (ins->inst_offset));
4476 ARM_LDRSB_IMM (code, ins->dreg, ins->inst_basereg, ins->inst_offset);
4478 case OP_LOADU1_MEMBASE:
4479 g_assert (arm_is_imm12 (ins->inst_offset));
4480 ARM_LDRB_IMM (code, ins->dreg, ins->inst_basereg, ins->inst_offset);
4482 case OP_LOADU2_MEMBASE:
4483 g_assert (arm_is_imm8 (ins->inst_offset));
4484 ARM_LDRH_IMM (code, ins->dreg, ins->inst_basereg, ins->inst_offset);
4486 case OP_LOADI2_MEMBASE:
4487 g_assert (arm_is_imm8 (ins->inst_offset));
4488 ARM_LDRSH_IMM (code, ins->dreg, ins->inst_basereg, ins->inst_offset);
4490 case OP_ICONV_TO_I1:
4491 ARM_SHL_IMM (code, ins->dreg, ins->sreg1, 24);
4492 ARM_SAR_IMM (code, ins->dreg, ins->dreg, 24);
4494 case OP_ICONV_TO_I2:
4495 ARM_SHL_IMM (code, ins->dreg, ins->sreg1, 16);
4496 ARM_SAR_IMM (code, ins->dreg, ins->dreg, 16);
4498 case OP_ICONV_TO_U1:
4499 ARM_AND_REG_IMM8 (code, ins->dreg, ins->sreg1, 0xff);
4501 case OP_ICONV_TO_U2:
4502 ARM_SHL_IMM (code, ins->dreg, ins->sreg1, 16);
4503 ARM_SHR_IMM (code, ins->dreg, ins->dreg, 16);
4507 ARM_CMP_REG_REG (code, ins->sreg1, ins->sreg2);
4509 case OP_COMPARE_IMM:
4510 case OP_ICOMPARE_IMM:
4511 imm8 = mono_arm_is_rotated_imm8 (ins->inst_imm, &rot_amount);
4512 g_assert (imm8 >= 0);
4513 ARM_CMP_REG_IMM (code, ins->sreg1, imm8, rot_amount);
4517 * gdb does not like encountering the hw breakpoint ins in the debugged code.
4518 * So instead of emitting a trap, we emit a call to a C function and place a
4521 //*(int*)code = 0xef9f0001;
4524 mono_add_patch_info (cfg, code - cfg->native_code, MONO_PATCH_INFO_INTERNAL_METHOD,
4525 (gpointer)"mono_break");
4526 code = emit_call_seq (cfg, code);
4528 case OP_RELAXED_NOP:
4533 case OP_DUMMY_STORE:
4534 case OP_DUMMY_ICONST:
4535 case OP_DUMMY_R8CONST:
4536 case OP_NOT_REACHED:
4539 case OP_IL_SEQ_POINT:
4540 mono_add_seq_point (cfg, bb, ins, code - cfg->native_code);
4542 case OP_SEQ_POINT: {
4544 MonoInst *info_var = cfg->arch.seq_point_info_var;
4545 MonoInst *ss_trigger_page_var = cfg->arch.ss_trigger_page_var;
4546 MonoInst *ss_method_var = cfg->arch.seq_point_ss_method_var;
4547 MonoInst *bp_method_var = cfg->arch.seq_point_bp_method_var;
4549 int dreg = ARMREG_LR;
4552 if (cfg->soft_breakpoints) {
4553 g_assert (!cfg->compile_aot);
4558 * For AOT, we use one got slot per method, which will point to a
4559 * SeqPointInfo structure, containing all the information required
4560 * by the code below.
4562 if (cfg->compile_aot) {
4563 g_assert (info_var);
4564 g_assert (info_var->opcode == OP_REGOFFSET);
4565 g_assert (arm_is_imm12 (info_var->inst_offset));
4568 if (!cfg->soft_breakpoints && !cfg->compile_aot) {
4570 * Read from the single stepping trigger page. This will cause a
4571 * SIGSEGV when single stepping is enabled.
4572 * We do this _before_ the breakpoint, so single stepping after
4573 * a breakpoint is hit will step to the next IL offset.
4575 g_assert (((guint64)(gsize)ss_trigger_page >> 32) == 0);
4578 /* Single step check */
4579 if (ins->flags & MONO_INST_SINGLE_STEP_LOC) {
4580 if (cfg->soft_breakpoints) {
4581 /* Load the address of the sequence point method variable. */
4582 var = ss_method_var;
4584 g_assert (var->opcode == OP_REGOFFSET);
4585 g_assert (arm_is_imm12 (var->inst_offset));
4586 ARM_LDR_IMM (code, dreg, var->inst_basereg, var->inst_offset);
4588 /* Read the value and check whether it is non-zero. */
4589 ARM_LDR_IMM (code, dreg, dreg, 0);
4590 ARM_CMP_REG_IMM (code, dreg, 0, 0);
4591 /* Call it conditionally. */
4592 ARM_BLX_REG_COND (code, ARMCOND_NE, dreg);
4594 if (cfg->compile_aot) {
4595 /* Load the trigger page addr from the variable initialized in the prolog */
4596 var = ss_trigger_page_var;
4598 g_assert (var->opcode == OP_REGOFFSET);
4599 g_assert (arm_is_imm12 (var->inst_offset));
4600 ARM_LDR_IMM (code, dreg, var->inst_basereg, var->inst_offset);
4602 ARM_LDR_IMM (code, dreg, ARMREG_PC, 0);
4604 *(int*)code = (int)ss_trigger_page;
4607 ARM_LDR_IMM (code, dreg, dreg, 0);
4611 mono_add_seq_point (cfg, bb, ins, code - cfg->native_code);
4613 /* Breakpoint check */
4614 if (cfg->compile_aot) {
4615 guint32 offset = code - cfg->native_code;
4618 ARM_LDR_IMM (code, dreg, info_var->inst_basereg, info_var->inst_offset);
4619 /* Add the offset */
4620 val = ((offset / 4) * sizeof (guint8*)) + MONO_STRUCT_OFFSET (SeqPointInfo, bp_addrs);
4621 /* Load the info->bp_addrs [offset], which is either 0 or the address of a trigger page */
4622 if (arm_is_imm12 ((int)val)) {
4623 ARM_LDR_IMM (code, dreg, dreg, val);
4625 ARM_ADD_REG_IMM (code, dreg, dreg, (val & 0xFF), 0);
4627 ARM_ADD_REG_IMM (code, dreg, dreg, (val & 0xFF00) >> 8, 24);
4629 ARM_ADD_REG_IMM (code, dreg, dreg, (val & 0xFF0000) >> 16, 16);
4630 g_assert (!(val & 0xFF000000));
4632 ARM_LDR_IMM (code, dreg, dreg, 0);
4634 /* What is faster, a branch or a load ? */
4635 ARM_CMP_REG_IMM (code, dreg, 0, 0);
4636 /* The breakpoint instruction */
4637 if (cfg->soft_breakpoints)
4638 ARM_BLX_REG_COND (code, ARMCOND_NE, dreg);
4640 ARM_LDR_IMM_COND (code, dreg, dreg, 0, ARMCOND_NE);
4641 } else if (cfg->soft_breakpoints) {
4642 /* Load the address of the breakpoint method into ip. */
4643 var = bp_method_var;
4645 g_assert (var->opcode == OP_REGOFFSET);
4646 g_assert (arm_is_imm12 (var->inst_offset));
4647 ARM_LDR_IMM (code, dreg, var->inst_basereg, var->inst_offset);
4650 * A placeholder for a possible breakpoint inserted by
4651 * mono_arch_set_breakpoint ().
4656 * A placeholder for a possible breakpoint inserted by
4657 * mono_arch_set_breakpoint ().
4659 for (i = 0; i < 4; ++i)
4664 * Add an additional nop so skipping the bp doesn't cause the ip to point
4665 * to another IL offset.
4673 ARM_ADDS_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4676 ARM_ADD_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4680 ARM_ADCS_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4683 imm8 = mono_arm_is_rotated_imm8 (ins->inst_imm, &rot_amount);
4684 g_assert (imm8 >= 0);
4685 ARM_ADDS_REG_IMM (code, ins->dreg, ins->sreg1, imm8, rot_amount);
4689 imm8 = mono_arm_is_rotated_imm8 (ins->inst_imm, &rot_amount);
4690 g_assert (imm8 >= 0);
4691 ARM_ADD_REG_IMM (code, ins->dreg, ins->sreg1, imm8, rot_amount);
4695 imm8 = mono_arm_is_rotated_imm8 (ins->inst_imm, &rot_amount);
4696 g_assert (imm8 >= 0);
4697 ARM_ADCS_REG_IMM (code, ins->dreg, ins->sreg1, imm8, rot_amount);
4700 ARM_ADD_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4701 //EMIT_COND_SYSTEM_EXCEPTION_FLAGS (PPC_BR_FALSE, PPC_BR_EQ, "OverflowException");
4703 case OP_IADD_OVF_UN:
4704 ARM_ADD_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4705 //EMIT_COND_SYSTEM_EXCEPTION_FLAGS (PPC_BR_FALSE, PPC_BR_EQ, "OverflowException");
4708 ARM_SUB_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4709 //EMIT_COND_SYSTEM_EXCEPTION_FLAGS (PPC_BR_FALSE, PPC_BR_EQ, "OverflowException");
4711 case OP_ISUB_OVF_UN:
4712 ARM_SUB_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4713 //EMIT_COND_SYSTEM_EXCEPTION_FLAGS (PPC_BR_TRUE, PPC_BR_EQ, "OverflowException");
4715 case OP_ADD_OVF_CARRY:
4716 ARM_ADCS_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4717 //EMIT_COND_SYSTEM_EXCEPTION_FLAGS (PPC_BR_FALSE, PPC_BR_EQ, "OverflowException");
4719 case OP_ADD_OVF_UN_CARRY:
4720 ARM_ADCS_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4721 //EMIT_COND_SYSTEM_EXCEPTION_FLAGS (PPC_BR_FALSE, PPC_BR_EQ, "OverflowException");
4723 case OP_SUB_OVF_CARRY:
4724 ARM_SBCS_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4725 //EMIT_COND_SYSTEM_EXCEPTION_FLAGS (PPC_BR_FALSE, PPC_BR_EQ, "OverflowException");
4727 case OP_SUB_OVF_UN_CARRY:
4728 ARM_SBCS_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4729 //EMIT_COND_SYSTEM_EXCEPTION_FLAGS (PPC_BR_TRUE, PPC_BR_EQ, "OverflowException");
4733 ARM_SUBS_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4736 imm8 = mono_arm_is_rotated_imm8 (ins->inst_imm, &rot_amount);
4737 g_assert (imm8 >= 0);
4738 ARM_SUBS_REG_IMM (code, ins->dreg, ins->sreg1, imm8, rot_amount);
4741 ARM_SUB_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4745 ARM_SBCS_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4749 imm8 = mono_arm_is_rotated_imm8 (ins->inst_imm, &rot_amount);
4750 g_assert (imm8 >= 0);
4751 ARM_SUB_REG_IMM (code, ins->dreg, ins->sreg1, imm8, rot_amount);
4755 imm8 = mono_arm_is_rotated_imm8 (ins->inst_imm, &rot_amount);
4756 g_assert (imm8 >= 0);
4757 ARM_SBCS_REG_IMM (code, ins->dreg, ins->sreg1, imm8, rot_amount);
4759 case OP_ARM_RSBS_IMM:
4760 imm8 = mono_arm_is_rotated_imm8 (ins->inst_imm, &rot_amount);
4761 g_assert (imm8 >= 0);
4762 ARM_RSBS_REG_IMM (code, ins->dreg, ins->sreg1, imm8, rot_amount);
4764 case OP_ARM_RSC_IMM:
4765 imm8 = mono_arm_is_rotated_imm8 (ins->inst_imm, &rot_amount);
4766 g_assert (imm8 >= 0);
4767 ARM_RSC_REG_IMM (code, ins->dreg, ins->sreg1, imm8, rot_amount);
4770 ARM_AND_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4774 imm8 = mono_arm_is_rotated_imm8 (ins->inst_imm, &rot_amount);
4775 g_assert (imm8 >= 0);
4776 ARM_AND_REG_IMM (code, ins->dreg, ins->sreg1, imm8, rot_amount);
4779 g_assert (v7s_supported || v7k_supported);
4780 ARM_SDIV (code, ins->dreg, ins->sreg1, ins->sreg2);
4783 g_assert (v7s_supported || v7k_supported);
4784 ARM_UDIV (code, ins->dreg, ins->sreg1, ins->sreg2);
4787 g_assert (v7s_supported || v7k_supported);
4788 ARM_SDIV (code, ARMREG_LR, ins->sreg1, ins->sreg2);
4789 ARM_MLS (code, ins->dreg, ARMREG_LR, ins->sreg2, ins->sreg1);
4792 g_assert (v7s_supported || v7k_supported);
4793 ARM_UDIV (code, ARMREG_LR, ins->sreg1, ins->sreg2);
4794 ARM_MLS (code, ins->dreg, ARMREG_LR, ins->sreg2, ins->sreg1);
4798 g_assert_not_reached ();
4800 ARM_ORR_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4804 imm8 = mono_arm_is_rotated_imm8 (ins->inst_imm, &rot_amount);
4805 g_assert (imm8 >= 0);
4806 ARM_ORR_REG_IMM (code, ins->dreg, ins->sreg1, imm8, rot_amount);
4809 ARM_EOR_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4813 imm8 = mono_arm_is_rotated_imm8 (ins->inst_imm, &rot_amount);
4814 g_assert (imm8 >= 0);
4815 ARM_EOR_REG_IMM (code, ins->dreg, ins->sreg1, imm8, rot_amount);
4818 ARM_SHL_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4823 ARM_SHL_IMM (code, ins->dreg, ins->sreg1, (ins->inst_imm & 0x1f));
4824 else if (ins->dreg != ins->sreg1)
4825 ARM_MOV_REG_REG (code, ins->dreg, ins->sreg1);
4828 ARM_SAR_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4833 ARM_SAR_IMM (code, ins->dreg, ins->sreg1, (ins->inst_imm & 0x1f));
4834 else if (ins->dreg != ins->sreg1)
4835 ARM_MOV_REG_REG (code, ins->dreg, ins->sreg1);
4838 case OP_ISHR_UN_IMM:
4840 ARM_SHR_IMM (code, ins->dreg, ins->sreg1, (ins->inst_imm & 0x1f));
4841 else if (ins->dreg != ins->sreg1)
4842 ARM_MOV_REG_REG (code, ins->dreg, ins->sreg1);
4845 ARM_SHR_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4848 ARM_MVN_REG_REG (code, ins->dreg, ins->sreg1);
4851 ARM_RSB_REG_IMM8 (code, ins->dreg, ins->sreg1, 0);
4854 if (ins->dreg == ins->sreg2)
4855 ARM_MUL_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4857 ARM_MUL_REG_REG (code, ins->dreg, ins->sreg2, ins->sreg1);
4860 g_assert_not_reached ();
4863 /* FIXME: handle ovf/ sreg2 != dreg */
4864 ARM_MUL_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4865 /* FIXME: MUL doesn't set the C/O flags on ARM */
4867 case OP_IMUL_OVF_UN:
4868 /* FIXME: handle ovf/ sreg2 != dreg */
4869 ARM_MUL_REG_REG (code, ins->dreg, ins->sreg1, ins->sreg2);
4870 /* FIXME: MUL doesn't set the C/O flags on ARM */
4873 code = mono_arm_emit_load_imm (code, ins->dreg, ins->inst_c0);
4876 /* Load the GOT offset */
4877 mono_add_patch_info (cfg, offset, (MonoJumpInfoType)ins->inst_i1, ins->inst_p0);
4878 ARM_LDR_IMM (code, ins->dreg, ARMREG_PC, 0);
4880 *(gpointer*)code = NULL;
4882 /* Load the value from the GOT */
4883 ARM_LDR_REG_REG (code, ins->dreg, ARMREG_PC, ins->dreg);
4885 case OP_OBJC_GET_SELECTOR:
4886 mono_add_patch_info (cfg, offset, MONO_PATCH_INFO_OBJC_SELECTOR_REF, ins->inst_p0);
4887 ARM_LDR_IMM (code, ins->dreg, ARMREG_PC, 0);
4889 *(gpointer*)code = NULL;
4891 ARM_LDR_REG_REG (code, ins->dreg, ARMREG_PC, ins->dreg);
4893 case OP_ICONV_TO_I4:
4894 case OP_ICONV_TO_U4:
4896 if (ins->dreg != ins->sreg1)
4897 ARM_MOV_REG_REG (code, ins->dreg, ins->sreg1);
4900 int saved = ins->sreg2;
4901 if (ins->sreg2 == ARM_LSW_REG) {
4902 ARM_MOV_REG_REG (code, ARMREG_LR, ins->sreg2);
4905 if (ins->sreg1 != ARM_LSW_REG)
4906 ARM_MOV_REG_REG (code, ARM_LSW_REG, ins->sreg1);
4907 if (saved != ARM_MSW_REG)
4908 ARM_MOV_REG_REG (code, ARM_MSW_REG, saved);
4912 if (IS_VFP && ins->dreg != ins->sreg1)
4913 ARM_CPYD (code, ins->dreg, ins->sreg1);
4916 if (IS_VFP && ins->dreg != ins->sreg1)
4917 ARM_CPYS (code, ins->dreg, ins->sreg1);
4919 case OP_MOVE_F_TO_I4:
4921 ARM_FMRS (code, ins->dreg, ins->sreg1);
4923 code = mono_arm_emit_vfp_scratch_save (cfg, code, vfp_scratch1);
4924 ARM_CVTD (code, vfp_scratch1, ins->sreg1);
4925 ARM_FMRS (code, ins->dreg, vfp_scratch1);
4926 code = mono_arm_emit_vfp_scratch_restore (cfg, code, vfp_scratch1);
4929 case OP_MOVE_I4_TO_F:
4931 ARM_FMSR (code, ins->dreg, ins->sreg1);
4933 ARM_FMSR (code, ins->dreg, ins->sreg1);
4934 ARM_CVTS (code, ins->dreg, ins->dreg);
4937 case OP_FCONV_TO_R4:
4940 ARM_CVTD (code, ins->dreg, ins->sreg1);
4942 ARM_CVTD (code, ins->dreg, ins->sreg1);
4943 ARM_CVTS (code, ins->dreg, ins->dreg);
4948 MonoCallInst *call = (MonoCallInst*)ins;
4951 * The stack looks like the following:
4952 * <caller argument area>
4955 * <callee argument area>
4956 * Need to copy the arguments from the callee argument area to
4957 * the caller argument area, and pop the frame.
4959 if (call->stack_usage) {
4960 int i, prev_sp_offset = 0;
4962 /* Compute size of saved registers restored below */
4964 prev_sp_offset = 2 * 4;
4966 prev_sp_offset = 1 * 4;
4967 for (i = 0; i < 16; ++i) {
4968 if (cfg->used_int_regs & (1 << i))
4969 prev_sp_offset += 4;
4972 code = emit_big_add (code, ARMREG_IP, cfg->frame_reg, cfg->stack_usage + prev_sp_offset);
4974 /* Copy arguments on the stack to our argument area */
4975 for (i = 0; i < call->stack_usage; i += sizeof (mgreg_t)) {
4976 ARM_LDR_IMM (code, ARMREG_LR, ARMREG_SP, i);
4977 ARM_STR_IMM (code, ARMREG_LR, ARMREG_IP, i);
4982 * Keep in sync with mono_arch_emit_epilog
4984 g_assert (!cfg->method->save_lmf);
4986 code = emit_big_add (code, ARMREG_SP, cfg->frame_reg, cfg->stack_usage);
4988 if (cfg->used_int_regs)
4989 ARM_POP (code, cfg->used_int_regs);
4990 ARM_POP (code, (1 << ARMREG_R7) | (1 << ARMREG_LR));
4992 ARM_POP (code, cfg->used_int_regs | (1 << ARMREG_LR));
4995 mono_add_patch_info (cfg, (guint8*) code - cfg->native_code, MONO_PATCH_INFO_METHOD_JUMP, call->method);
4996 if (cfg->compile_aot) {
4997 ARM_LDR_IMM (code, ARMREG_IP, ARMREG_PC, 0);
4999 *(gpointer*)code = NULL;
5001 ARM_LDR_REG_REG (code, ARMREG_PC, ARMREG_PC, ARMREG_IP);
5003 code = mono_arm_patchable_b (code, ARMCOND_AL);
5004 cfg->thunk_area += THUNK_SIZE;
5009 /* ensure ins->sreg1 is not NULL */
5010 ARM_LDRB_IMM (code, ARMREG_LR, ins->sreg1, 0);
5013 g_assert (cfg->sig_cookie < 128);
5014 ARM_LDR_IMM (code, ARMREG_IP, cfg->frame_reg, cfg->sig_cookie);
5015 ARM_STR_IMM (code, ARMREG_IP, ins->sreg1, 0);
5025 call = (MonoCallInst*)ins;
5028 code = emit_float_args (cfg, call, code, &max_len, &offset);
5030 if (ins->flags & MONO_INST_HAS_METHOD)
5031 mono_add_patch_info (cfg, offset, MONO_PATCH_INFO_METHOD, call->method);
5033 mono_add_patch_info (cfg, offset, MONO_PATCH_INFO_ABS, call->fptr);
5034 code = emit_call_seq (cfg, code);
5035 ins->flags |= MONO_INST_GC_CALLSITE;
5036 ins->backend.pc_offset = code - cfg->native_code;
5037 code = emit_move_return_value (cfg, ins, code);
5044 case OP_VOIDCALL_REG:
5047 code = emit_float_args (cfg, (MonoCallInst *)ins, code, &max_len, &offset);
5049 code = emit_call_reg (code, ins->sreg1);
5050 ins->flags |= MONO_INST_GC_CALLSITE;
5051 ins->backend.pc_offset = code - cfg->native_code;
5052 code = emit_move_return_value (cfg, ins, code);
5054 case OP_FCALL_MEMBASE:
5055 case OP_RCALL_MEMBASE:
5056 case OP_LCALL_MEMBASE:
5057 case OP_VCALL_MEMBASE:
5058 case OP_VCALL2_MEMBASE:
5059 case OP_VOIDCALL_MEMBASE:
5060 case OP_CALL_MEMBASE: {
5061 g_assert (ins->sreg1 != ARMREG_LR);
5062 call = (MonoCallInst*)ins;
5065 code = emit_float_args (cfg, call, code, &max_len, &offset);
5066 if (!arm_is_imm12 (ins->inst_offset)) {
5067 /* sreg1 might be IP */
5068 ARM_MOV_REG_REG (code, ARMREG_LR, ins->sreg1);
5069 code = mono_arm_emit_load_imm (code, ARMREG_IP, ins->inst_offset);
5070 ARM_ADD_REG_REG (code, ARMREG_IP, ARMREG_IP, ARMREG_LR);
5071 ARM_MOV_REG_REG (code, ARMREG_LR, ARMREG_PC);
5072 ARM_LDR_IMM (code, ARMREG_PC, ARMREG_IP, 0);
5074 ARM_MOV_REG_REG (code, ARMREG_LR, ARMREG_PC);
5075 ARM_LDR_IMM (code, ARMREG_PC, ins->sreg1, ins->inst_offset);
5077 ins->flags |= MONO_INST_GC_CALLSITE;
5078 ins->backend.pc_offset = code - cfg->native_code;
5079 code = emit_move_return_value (cfg, ins, code);
5082 case OP_GENERIC_CLASS_INIT: {
5086 byte_offset = MONO_STRUCT_OFFSET (MonoVTable, initialized);
5088 g_assert (arm_is_imm8 (byte_offset));
5089 ARM_LDRSB_IMM (code, ARMREG_IP, ins->sreg1, byte_offset);
5090 ARM_CMP_REG_IMM (code, ARMREG_IP, 0, 0);
5092 ARM_B_COND (code, ARMCOND_NE, 0);
5094 /* Uninitialized case */
5095 g_assert (ins->sreg1 == ARMREG_R0);
5097 mono_add_patch_info (cfg, code - cfg->native_code, MONO_PATCH_INFO_INTERNAL_METHOD,
5098 (gpointer)"mono_generic_class_init");
5099 code = emit_call_seq (cfg, code);
5101 /* Initialized case */
5102 arm_patch (jump, code);
5106 /* round the size to 8 bytes */
5107 ARM_ADD_REG_IMM8 (code, ins->dreg, ins->sreg1, (MONO_ARCH_FRAME_ALIGNMENT - 1));
5108 ARM_BIC_REG_IMM8 (code, ins->dreg, ins->dreg, (MONO_ARCH_FRAME_ALIGNMENT - 1));
5109 ARM_SUB_REG_REG (code, ARMREG_SP, ARMREG_SP, ins->dreg);
5110 /* memzero the area: dreg holds the size, sp is the pointer */
5111 if (ins->flags & MONO_INST_INIT) {
5112 guint8 *start_loop, *branch_to_cond;
5113 ARM_MOV_REG_IMM8 (code, ARMREG_LR, 0);
5114 branch_to_cond = code;
5117 ARM_STR_REG_REG (code, ARMREG_LR, ARMREG_SP, ins->dreg);
5118 arm_patch (branch_to_cond, code);
5119 /* decrement by 4 and set flags */
5120 ARM_SUBS_REG_IMM8 (code, ins->dreg, ins->dreg, sizeof (mgreg_t));
5121 ARM_B_COND (code, ARMCOND_GE, 0);
5122 arm_patch (code - 4, start_loop);
5124 ARM_MOV_REG_REG (code, ins->dreg, ARMREG_SP);
5125 if (cfg->param_area)
5126 code = emit_sub_imm (code, ARMREG_SP, ARMREG_SP, ALIGN_TO (cfg->param_area, MONO_ARCH_FRAME_ALIGNMENT));
5131 MonoInst *var = cfg->dyn_call_var;
5134 g_assert (var->opcode == OP_REGOFFSET);
5135 g_assert (arm_is_imm12 (var->inst_offset));
5137 /* lr = args buffer filled by mono_arch_get_dyn_call_args () */
5138 ARM_MOV_REG_REG (code, ARMREG_LR, ins->sreg1);
5140 ARM_MOV_REG_REG (code, ARMREG_IP, ins->sreg2);
5142 /* Save args buffer */
5143 ARM_STR_IMM (code, ARMREG_LR, var->inst_basereg, var->inst_offset);
5145 /* Set stack slots using R0 as scratch reg */
5146 /* MONO_ARCH_DYN_CALL_PARAM_AREA gives the size of stack space available */
5147 for (i = 0; i < DYN_CALL_STACK_ARGS; ++i) {
5148 ARM_LDR_IMM (code, ARMREG_R0, ARMREG_LR, (PARAM_REGS + i) * sizeof (mgreg_t));
5149 ARM_STR_IMM (code, ARMREG_R0, ARMREG_SP, i * sizeof (mgreg_t));
5152 /* Set fp argument registers */
5153 if (IS_HARD_FLOAT) {
5154 ARM_LDR_IMM (code, ARMREG_R0, ARMREG_LR, MONO_STRUCT_OFFSET (DynCallArgs, has_fpregs));
5155 ARM_CMP_REG_IMM (code, ARMREG_R0, 0, 0);
5157 ARM_B_COND (code, ARMCOND_EQ, 0);
5158 for (i = 0; i < FP_PARAM_REGS; ++i) {
5159 int offset = MONO_STRUCT_OFFSET (DynCallArgs, fpregs) + (i * sizeof (double));
5160 g_assert (arm_is_fpimm8 (offset));
5161 ARM_FLDD (code, i * 2, ARMREG_LR, offset);
5163 arm_patch (buf [0], code);
5166 /* Set argument registers */
5167 for (i = 0; i < PARAM_REGS; ++i)
5168 ARM_LDR_IMM (code, i, ARMREG_LR, i * sizeof (mgreg_t));
5171 ARM_MOV_REG_REG (code, ARMREG_LR, ARMREG_PC);
5172 ARM_MOV_REG_REG (code, ARMREG_PC, ARMREG_IP);
5175 ARM_LDR_IMM (code, ARMREG_IP, var->inst_basereg, var->inst_offset);
5176 ARM_STR_IMM (code, ARMREG_R0, ARMREG_IP, MONO_STRUCT_OFFSET (DynCallArgs, res));
5177 ARM_STR_IMM (code, ARMREG_R1, ARMREG_IP, MONO_STRUCT_OFFSET (DynCallArgs, res2));
5179 ARM_FSTD (code, ARM_VFP_D0, ARMREG_IP, MONO_STRUCT_OFFSET (DynCallArgs, fpregs));
5183 if (ins->sreg1 != ARMREG_R0)
5184 ARM_MOV_REG_REG (code, ARMREG_R0, ins->sreg1);
5185 mono_add_patch_info (cfg, code - cfg->native_code, MONO_PATCH_INFO_INTERNAL_METHOD,
5186 (gpointer)"mono_arch_throw_exception");
5187 code = emit_call_seq (cfg, code);
5191 if (ins->sreg1 != ARMREG_R0)
5192 ARM_MOV_REG_REG (code, ARMREG_R0, ins->sreg1);
5193 mono_add_patch_info (cfg, code - cfg->native_code, MONO_PATCH_INFO_INTERNAL_METHOD,
5194 (gpointer)"mono_arch_rethrow_exception");
5195 code = emit_call_seq (cfg, code);
5198 case OP_START_HANDLER: {
5199 MonoInst *spvar = mono_find_spvar_for_region (cfg, bb->region);
5200 int param_area = ALIGN_TO (cfg->param_area, MONO_ARCH_FRAME_ALIGNMENT);
5203 /* Reserve a param area, see filter-stack.exe */
5205 if ((i = mono_arm_is_rotated_imm8 (param_area, &rot_amount)) >= 0) {
5206 ARM_SUB_REG_IMM (code, ARMREG_SP, ARMREG_SP, i, rot_amount);
5208 code = mono_arm_emit_load_imm (code, ARMREG_IP, param_area);
5209 ARM_SUB_REG_REG (code, ARMREG_SP, ARMREG_SP, ARMREG_IP);
5213 if (arm_is_imm12 (spvar->inst_offset)) {
5214 ARM_STR_IMM (code, ARMREG_LR, spvar->inst_basereg, spvar->inst_offset);
5216 code = mono_arm_emit_load_imm (code, ARMREG_IP, spvar->inst_offset);
5217 ARM_STR_REG_REG (code, ARMREG_LR, spvar->inst_basereg, ARMREG_IP);
5221 case OP_ENDFILTER: {
5222 MonoInst *spvar = mono_find_spvar_for_region (cfg, bb->region);
5223 int param_area = ALIGN_TO (cfg->param_area, MONO_ARCH_FRAME_ALIGNMENT);
5226 /* Free the param area */
5228 if ((i = mono_arm_is_rotated_imm8 (param_area, &rot_amount)) >= 0) {
5229 ARM_ADD_REG_IMM (code, ARMREG_SP, ARMREG_SP, i, rot_amount);
5231 code = mono_arm_emit_load_imm (code, ARMREG_IP, param_area);
5232 ARM_ADD_REG_REG (code, ARMREG_SP, ARMREG_SP, ARMREG_IP);
5236 if (ins->sreg1 != ARMREG_R0)
5237 ARM_MOV_REG_REG (code, ARMREG_R0, ins->sreg1);
5238 if (arm_is_imm12 (spvar->inst_offset)) {
5239 ARM_LDR_IMM (code, ARMREG_IP, spvar->inst_basereg, spvar->inst_offset);
5241 g_assert (ARMREG_IP != spvar->inst_basereg);
5242 code = mono_arm_emit_load_imm (code, ARMREG_IP, spvar->inst_offset);
5243 ARM_LDR_REG_REG (code, ARMREG_IP, spvar->inst_basereg, ARMREG_IP);
5245 ARM_MOV_REG_REG (code, ARMREG_PC, ARMREG_IP);
5248 case OP_ENDFINALLY: {
5249 MonoInst *spvar = mono_find_spvar_for_region (cfg, bb->region);
5250 int param_area = ALIGN_TO (cfg->param_area, MONO_ARCH_FRAME_ALIGNMENT);
5253 /* Free the param area */
5255 if ((i = mono_arm_is_rotated_imm8 (param_area, &rot_amount)) >= 0) {
5256 ARM_ADD_REG_IMM (code, ARMREG_SP, ARMREG_SP, i, rot_amount);
5258 code = mono_arm_emit_load_imm (code, ARMREG_IP, param_area);
5259 ARM_ADD_REG_REG (code, ARMREG_SP, ARMREG_SP, ARMREG_IP);
5263 if (arm_is_imm12 (spvar->inst_offset)) {
5264 ARM_LDR_IMM (code, ARMREG_IP, spvar->inst_basereg, spvar->inst_offset);
5266 g_assert (ARMREG_IP != spvar->inst_basereg);
5267 code = mono_arm_emit_load_imm (code, ARMREG_IP, spvar->inst_offset);
5268 ARM_LDR_REG_REG (code, ARMREG_IP, spvar->inst_basereg, ARMREG_IP);
5270 ARM_MOV_REG_REG (code, ARMREG_PC, ARMREG_IP);
5273 case OP_CALL_HANDLER:
5274 mono_add_patch_info (cfg, code - cfg->native_code, MONO_PATCH_INFO_BB, ins->inst_target_bb);
5275 code = mono_arm_patchable_bl (code, ARMCOND_AL);
5276 cfg->thunk_area += THUNK_SIZE;
5277 mono_cfg_add_try_hole (cfg, ins->inst_eh_block, code, bb);
5280 if (ins->dreg != ARMREG_R0)
5281 ARM_MOV_REG_REG (code, ins->dreg, ARMREG_R0);
5285 ins->inst_c0 = code - cfg->native_code;
5288 /*if (ins->inst_target_bb->native_offset) {
5290 //x86_jump_code (code, cfg->native_code + ins->inst_target_bb->native_offset);
5292 mono_add_patch_info (cfg, offset, MONO_PATCH_INFO_BB, ins->inst_target_bb);
5293 code = mono_arm_patchable_b (code, ARMCOND_AL);
5297 ARM_MOV_REG_REG (code, ARMREG_PC, ins->sreg1);
5301 * In the normal case we have:
5302 * ldr pc, [pc, ins->sreg1 << 2]
5305 * ldr lr, [pc, ins->sreg1 << 2]
5307 * After follows the data.
5308 * FIXME: add aot support.
5310 mono_add_patch_info (cfg, offset, MONO_PATCH_INFO_SWITCH, ins->inst_p0);
5311 max_len += 4 * GPOINTER_TO_INT (ins->klass);
5312 if (offset + max_len > (cfg->code_size - 16)) {
5313 cfg->code_size += max_len;
5314 cfg->code_size *= 2;
5315 cfg->native_code = g_realloc (cfg->native_code, cfg->code_size);
5316 code = cfg->native_code + offset;
5318 ARM_LDR_REG_REG_SHIFT (code, ARMREG_PC, ARMREG_PC, ins->sreg1, ARMSHIFT_LSL, 2);
5320 code += 4 * GPOINTER_TO_INT (ins->klass);
5324 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 0, ARMCOND_NE);
5325 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_EQ);
5329 ARM_MOV_REG_IMM8 (code, ins->dreg, 0);
5330 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_LT);
5334 ARM_MOV_REG_IMM8 (code, ins->dreg, 0);
5335 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_LO);
5339 ARM_MOV_REG_IMM8 (code, ins->dreg, 0);
5340 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_GT);
5344 ARM_MOV_REG_IMM8 (code, ins->dreg, 0);
5345 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_HI);
5348 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_NE);
5349 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 0, ARMCOND_EQ);
5352 ARM_MOV_REG_IMM8 (code, ins->dreg, 1);
5353 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 0, ARMCOND_LT);
5356 ARM_MOV_REG_IMM8 (code, ins->dreg, 1);
5357 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 0, ARMCOND_GT);
5360 ARM_MOV_REG_IMM8 (code, ins->dreg, 1);
5361 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 0, ARMCOND_LO);
5364 ARM_MOV_REG_IMM8 (code, ins->dreg, 1);
5365 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 0, ARMCOND_HI);
5367 case OP_COND_EXC_EQ:
5368 case OP_COND_EXC_NE_UN:
5369 case OP_COND_EXC_LT:
5370 case OP_COND_EXC_LT_UN:
5371 case OP_COND_EXC_GT:
5372 case OP_COND_EXC_GT_UN:
5373 case OP_COND_EXC_GE:
5374 case OP_COND_EXC_GE_UN:
5375 case OP_COND_EXC_LE:
5376 case OP_COND_EXC_LE_UN:
5377 EMIT_COND_SYSTEM_EXCEPTION (ins->opcode - OP_COND_EXC_EQ, ins->inst_p1);
5379 case OP_COND_EXC_IEQ:
5380 case OP_COND_EXC_INE_UN:
5381 case OP_COND_EXC_ILT:
5382 case OP_COND_EXC_ILT_UN:
5383 case OP_COND_EXC_IGT:
5384 case OP_COND_EXC_IGT_UN:
5385 case OP_COND_EXC_IGE:
5386 case OP_COND_EXC_IGE_UN:
5387 case OP_COND_EXC_ILE:
5388 case OP_COND_EXC_ILE_UN:
5389 EMIT_COND_SYSTEM_EXCEPTION (ins->opcode - OP_COND_EXC_IEQ, ins->inst_p1);
5392 case OP_COND_EXC_IC:
5393 EMIT_COND_SYSTEM_EXCEPTION_FLAGS (ARMCOND_CS, ins->inst_p1);
5395 case OP_COND_EXC_OV:
5396 case OP_COND_EXC_IOV:
5397 EMIT_COND_SYSTEM_EXCEPTION_FLAGS (ARMCOND_VS, ins->inst_p1);
5399 case OP_COND_EXC_NC:
5400 case OP_COND_EXC_INC:
5401 EMIT_COND_SYSTEM_EXCEPTION_FLAGS (ARMCOND_CC, ins->inst_p1);
5403 case OP_COND_EXC_NO:
5404 case OP_COND_EXC_INO:
5405 EMIT_COND_SYSTEM_EXCEPTION_FLAGS (ARMCOND_VC, ins->inst_p1);
5417 EMIT_COND_BRANCH (ins, ins->opcode - OP_IBEQ);
5420 /* floating point opcodes */
5422 if (cfg->compile_aot) {
5423 ARM_FLDD (code, ins->dreg, ARMREG_PC, 0);
5425 *(guint32*)code = ((guint32*)(ins->inst_p0))[0];
5427 *(guint32*)code = ((guint32*)(ins->inst_p0))[1];
5430 /* FIXME: we can optimize the imm load by dealing with part of
5431 * the displacement in LDFD (aligning to 512).
5433 code = mono_arm_emit_load_imm (code, ARMREG_LR, (guint32)ins->inst_p0);
5434 ARM_FLDD (code, ins->dreg, ARMREG_LR, 0);
5438 if (cfg->compile_aot) {
5439 ARM_FLDS (code, ins->dreg, ARMREG_PC, 0);
5441 *(guint32*)code = ((guint32*)(ins->inst_p0))[0];
5444 ARM_CVTS (code, ins->dreg, ins->dreg);
5446 code = mono_arm_emit_load_imm (code, ARMREG_LR, (guint32)ins->inst_p0);
5447 ARM_FLDS (code, ins->dreg, ARMREG_LR, 0);
5449 ARM_CVTS (code, ins->dreg, ins->dreg);
5452 case OP_STORER8_MEMBASE_REG:
5453 /* This is generated by the local regalloc pass which runs after the lowering pass */
5454 if (!arm_is_fpimm8 (ins->inst_offset)) {
5455 code = mono_arm_emit_load_imm (code, ARMREG_LR, ins->inst_offset);
5456 ARM_ADD_REG_REG (code, ARMREG_LR, ARMREG_LR, ins->inst_destbasereg);
5457 ARM_FSTD (code, ins->sreg1, ARMREG_LR, 0);
5459 ARM_FSTD (code, ins->sreg1, ins->inst_destbasereg, ins->inst_offset);
5462 case OP_LOADR8_MEMBASE:
5463 /* This is generated by the local regalloc pass which runs after the lowering pass */
5464 if (!arm_is_fpimm8 (ins->inst_offset)) {
5465 code = mono_arm_emit_load_imm (code, ARMREG_LR, ins->inst_offset);
5466 ARM_ADD_REG_REG (code, ARMREG_LR, ARMREG_LR, ins->inst_basereg);
5467 ARM_FLDD (code, ins->dreg, ARMREG_LR, 0);
5469 ARM_FLDD (code, ins->dreg, ins->inst_basereg, ins->inst_offset);
5472 case OP_STORER4_MEMBASE_REG:
5473 g_assert (arm_is_fpimm8 (ins->inst_offset));
5475 ARM_FSTS (code, ins->sreg1, ins->inst_destbasereg, ins->inst_offset);
5477 code = mono_arm_emit_vfp_scratch_save (cfg, code, vfp_scratch1);
5478 ARM_CVTD (code, vfp_scratch1, ins->sreg1);
5479 ARM_FSTS (code, vfp_scratch1, ins->inst_destbasereg, ins->inst_offset);
5480 code = mono_arm_emit_vfp_scratch_restore (cfg, code, vfp_scratch1);
5483 case OP_LOADR4_MEMBASE:
5485 ARM_FLDS (code, ins->dreg, ins->inst_basereg, ins->inst_offset);
5487 g_assert (arm_is_fpimm8 (ins->inst_offset));
5488 code = mono_arm_emit_vfp_scratch_save (cfg, code, vfp_scratch1);
5489 ARM_FLDS (code, vfp_scratch1, ins->inst_basereg, ins->inst_offset);
5490 ARM_CVTS (code, ins->dreg, vfp_scratch1);
5491 code = mono_arm_emit_vfp_scratch_restore (cfg, code, vfp_scratch1);
5494 case OP_ICONV_TO_R_UN: {
5495 g_assert_not_reached ();
5498 case OP_ICONV_TO_R4:
5500 ARM_FMSR (code, ins->dreg, ins->sreg1);
5501 ARM_FSITOS (code, ins->dreg, ins->dreg);
5503 code = mono_arm_emit_vfp_scratch_save (cfg, code, vfp_scratch1);
5504 ARM_FMSR (code, vfp_scratch1, ins->sreg1);
5505 ARM_FSITOS (code, vfp_scratch1, vfp_scratch1);
5506 ARM_CVTS (code, ins->dreg, vfp_scratch1);
5507 code = mono_arm_emit_vfp_scratch_restore (cfg, code, vfp_scratch1);
5510 case OP_ICONV_TO_R8:
5511 code = mono_arm_emit_vfp_scratch_save (cfg, code, vfp_scratch1);
5512 ARM_FMSR (code, vfp_scratch1, ins->sreg1);
5513 ARM_FSITOD (code, ins->dreg, vfp_scratch1);
5514 code = mono_arm_emit_vfp_scratch_restore (cfg, code, vfp_scratch1);
5518 MonoType *sig_ret = mini_get_underlying_type (mono_method_signature (cfg->method)->ret);
5519 if (sig_ret->type == MONO_TYPE_R4) {
5521 if (IS_HARD_FLOAT) {
5522 if (ins->sreg1 != ARM_VFP_D0)
5523 ARM_CPYS (code, ARM_VFP_D0, ins->sreg1);
5525 ARM_FMRS (code, ARMREG_R0, ins->sreg1);
5528 ARM_CVTD (code, ARM_VFP_F0, ins->sreg1);
5531 ARM_FMRS (code, ARMREG_R0, ARM_VFP_F0);
5535 ARM_CPYD (code, ARM_VFP_D0, ins->sreg1);
5537 ARM_FMRRD (code, ARMREG_R0, ARMREG_R1, ins->sreg1);
5541 case OP_FCONV_TO_I1:
5542 code = emit_float_to_int (cfg, code, ins->dreg, ins->sreg1, 1, TRUE);
5544 case OP_FCONV_TO_U1:
5545 code = emit_float_to_int (cfg, code, ins->dreg, ins->sreg1, 1, FALSE);
5547 case OP_FCONV_TO_I2:
5548 code = emit_float_to_int (cfg, code, ins->dreg, ins->sreg1, 2, TRUE);
5550 case OP_FCONV_TO_U2:
5551 code = emit_float_to_int (cfg, code, ins->dreg, ins->sreg1, 2, FALSE);
5553 case OP_FCONV_TO_I4:
5555 code = emit_float_to_int (cfg, code, ins->dreg, ins->sreg1, 4, TRUE);
5557 case OP_FCONV_TO_U4:
5559 code = emit_float_to_int (cfg, code, ins->dreg, ins->sreg1, 4, FALSE);
5561 case OP_FCONV_TO_I8:
5562 case OP_FCONV_TO_U8:
5563 g_assert_not_reached ();
5564 /* Implemented as helper calls */
5566 case OP_LCONV_TO_R_UN:
5567 g_assert_not_reached ();
5568 /* Implemented as helper calls */
5570 case OP_LCONV_TO_OVF_I4_2: {
5571 guint8 *high_bit_not_set, *valid_negative, *invalid_negative, *valid_positive;
5573 * Valid ints: 0xffffffff:0x80000000 to 0x00000000:0x7fffffff
5576 ARM_CMP_REG_IMM8 (code, ins->sreg1, 0);
5577 high_bit_not_set = code;
5578 ARM_B_COND (code, ARMCOND_GE, 0); /*branch if bit 31 of the lower part is not set*/
5580 ARM_CMN_REG_IMM8 (code, ins->sreg2, 1); /*This have the same effect as CMP reg, 0xFFFFFFFF */
5581 valid_negative = code;
5582 ARM_B_COND (code, ARMCOND_EQ, 0); /*branch if upper part == 0xFFFFFFFF (lower part has bit 31 set) */
5583 invalid_negative = code;
5584 ARM_B_COND (code, ARMCOND_AL, 0);
5586 arm_patch (high_bit_not_set, code);
5588 ARM_CMP_REG_IMM8 (code, ins->sreg2, 0);
5589 valid_positive = code;
5590 ARM_B_COND (code, ARMCOND_EQ, 0); /*branch if upper part == 0 (lower part has bit 31 clear)*/
5592 arm_patch (invalid_negative, code);
5593 EMIT_COND_SYSTEM_EXCEPTION_FLAGS (ARMCOND_AL, "OverflowException");
5595 arm_patch (valid_negative, code);
5596 arm_patch (valid_positive, code);
5598 if (ins->dreg != ins->sreg1)
5599 ARM_MOV_REG_REG (code, ins->dreg, ins->sreg1);
5603 ARM_VFP_ADDD (code, ins->dreg, ins->sreg1, ins->sreg2);
5606 ARM_VFP_SUBD (code, ins->dreg, ins->sreg1, ins->sreg2);
5609 ARM_VFP_MULD (code, ins->dreg, ins->sreg1, ins->sreg2);
5612 ARM_VFP_DIVD (code, ins->dreg, ins->sreg1, ins->sreg2);
5615 ARM_NEGD (code, ins->dreg, ins->sreg1);
5619 g_assert_not_reached ();
5623 ARM_CMPD (code, ins->sreg1, ins->sreg2);
5629 ARM_CMPS (code, ins->sreg1, ins->sreg2);
5634 ARM_CMPD (code, ins->sreg1, ins->sreg2);
5637 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 0, ARMCOND_NE);
5638 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_EQ);
5642 ARM_CMPD (code, ins->sreg1, ins->sreg2);
5645 ARM_MOV_REG_IMM8 (code, ins->dreg, 0);
5646 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_MI);
5650 ARM_CMPD (code, ins->sreg1, ins->sreg2);
5653 ARM_MOV_REG_IMM8 (code, ins->dreg, 0);
5654 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_MI);
5655 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_VS);
5659 ARM_CMPD (code, ins->sreg2, ins->sreg1);
5662 ARM_MOV_REG_IMM8 (code, ins->dreg, 0);
5663 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_MI);
5667 ARM_CMPD (code, ins->sreg2, ins->sreg1);
5670 ARM_MOV_REG_IMM8 (code, ins->dreg, 0);
5671 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_MI);
5672 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_VS);
5676 ARM_CMPD (code, ins->sreg1, ins->sreg2);
5679 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_NE);
5680 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 0, ARMCOND_EQ);
5684 ARM_CMPD (code, ins->sreg1, ins->sreg2);
5687 ARM_MOV_REG_IMM8 (code, ins->dreg, 1);
5688 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 0, ARMCOND_MI);
5692 ARM_CMPD (code, ins->sreg2, ins->sreg1);
5695 ARM_MOV_REG_IMM8 (code, ins->dreg, 1);
5696 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 0, ARMCOND_MI);
5699 /* ARM FPA flags table:
5700 * N Less than ARMCOND_MI
5701 * Z Equal ARMCOND_EQ
5702 * C Greater Than or Equal ARMCOND_CS
5703 * V Unordered ARMCOND_VS
5706 EMIT_COND_BRANCH (ins, OP_IBEQ - OP_IBEQ);
5709 EMIT_COND_BRANCH (ins, OP_IBNE_UN - OP_IBEQ);
5712 EMIT_COND_BRANCH_FLAGS (ins, ARMCOND_MI); /* N set */
5715 EMIT_COND_BRANCH_FLAGS (ins, ARMCOND_VS); /* V set */
5716 EMIT_COND_BRANCH_FLAGS (ins, ARMCOND_MI); /* N set */
5722 g_assert_not_reached ();
5726 EMIT_COND_BRANCH_FLAGS (ins, ARMCOND_GE);
5728 /* FPA requires EQ even though the docs suggest that just CS is enough */
5729 EMIT_COND_BRANCH_FLAGS (ins, ARMCOND_EQ);
5730 EMIT_COND_BRANCH_FLAGS (ins, ARMCOND_CS);
5734 EMIT_COND_BRANCH_FLAGS (ins, ARMCOND_VS); /* V set */
5735 EMIT_COND_BRANCH_FLAGS (ins, ARMCOND_GE);
5740 code = mono_arm_emit_vfp_scratch_save (cfg, code, vfp_scratch1);
5741 code = mono_arm_emit_vfp_scratch_save (cfg, code, vfp_scratch2);
5743 ARM_ABSD (code, vfp_scratch2, ins->sreg1);
5744 ARM_FLDD (code, vfp_scratch1, ARMREG_PC, 0);
5746 *(guint32*)code = 0xffffffff;
5748 *(guint32*)code = 0x7fefffff;
5750 ARM_CMPD (code, vfp_scratch2, vfp_scratch1);
5752 EMIT_COND_SYSTEM_EXCEPTION_FLAGS (ARMCOND_GT, "OverflowException");
5753 ARM_CMPD (code, ins->sreg1, ins->sreg1);
5755 EMIT_COND_SYSTEM_EXCEPTION_FLAGS (ARMCOND_VS, "OverflowException");
5756 ARM_CPYD (code, ins->dreg, ins->sreg1);
5758 code = mono_arm_emit_vfp_scratch_restore (cfg, code, vfp_scratch1);
5759 code = mono_arm_emit_vfp_scratch_restore (cfg, code, vfp_scratch2);
5764 case OP_RCONV_TO_I1:
5765 code = emit_r4_to_int (cfg, code, ins->dreg, ins->sreg1, 1, TRUE);
5767 case OP_RCONV_TO_U1:
5768 code = emit_r4_to_int (cfg, code, ins->dreg, ins->sreg1, 1, FALSE);
5770 case OP_RCONV_TO_I2:
5771 code = emit_r4_to_int (cfg, code, ins->dreg, ins->sreg1, 2, TRUE);
5773 case OP_RCONV_TO_U2:
5774 code = emit_r4_to_int (cfg, code, ins->dreg, ins->sreg1, 2, FALSE);
5776 case OP_RCONV_TO_I4:
5777 code = emit_r4_to_int (cfg, code, ins->dreg, ins->sreg1, 4, TRUE);
5779 case OP_RCONV_TO_U4:
5780 code = emit_r4_to_int (cfg, code, ins->dreg, ins->sreg1, 4, FALSE);
5782 case OP_RCONV_TO_R4:
5784 if (ins->dreg != ins->sreg1)
5785 ARM_CPYS (code, ins->dreg, ins->sreg1);
5787 case OP_RCONV_TO_R8:
5789 ARM_CVTS (code, ins->dreg, ins->sreg1);
5792 ARM_VFP_ADDS (code, ins->dreg, ins->sreg1, ins->sreg2);
5795 ARM_VFP_SUBS (code, ins->dreg, ins->sreg1, ins->sreg2);
5798 ARM_VFP_MULS (code, ins->dreg, ins->sreg1, ins->sreg2);
5801 ARM_VFP_DIVS (code, ins->dreg, ins->sreg1, ins->sreg2);
5804 ARM_NEGS (code, ins->dreg, ins->sreg1);
5808 ARM_CMPS (code, ins->sreg1, ins->sreg2);
5811 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 0, ARMCOND_NE);
5812 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_EQ);
5816 ARM_CMPS (code, ins->sreg1, ins->sreg2);
5819 ARM_MOV_REG_IMM8 (code, ins->dreg, 0);
5820 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_MI);
5824 ARM_CMPS (code, ins->sreg1, ins->sreg2);
5827 ARM_MOV_REG_IMM8 (code, ins->dreg, 0);
5828 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_MI);
5829 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_VS);
5833 ARM_CMPS (code, ins->sreg2, ins->sreg1);
5836 ARM_MOV_REG_IMM8 (code, ins->dreg, 0);
5837 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_MI);
5841 ARM_CMPS (code, ins->sreg2, ins->sreg1);
5844 ARM_MOV_REG_IMM8 (code, ins->dreg, 0);
5845 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_MI);
5846 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_VS);
5850 ARM_CMPS (code, ins->sreg1, ins->sreg2);
5853 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 1, ARMCOND_NE);
5854 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 0, ARMCOND_EQ);
5858 ARM_CMPS (code, ins->sreg1, ins->sreg2);
5861 ARM_MOV_REG_IMM8 (code, ins->dreg, 1);
5862 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 0, ARMCOND_MI);
5866 ARM_CMPS (code, ins->sreg2, ins->sreg1);
5869 ARM_MOV_REG_IMM8 (code, ins->dreg, 1);
5870 ARM_MOV_REG_IMM8_COND (code, ins->dreg, 0, ARMCOND_MI);
5873 case OP_GC_LIVENESS_DEF:
5874 case OP_GC_LIVENESS_USE:
5875 case OP_GC_PARAM_SLOT_LIVENESS_DEF:
5876 ins->backend.pc_offset = code - cfg->native_code;
5878 case OP_GC_SPILL_SLOT_LIVENESS_DEF:
5879 ins->backend.pc_offset = code - cfg->native_code;
5880 bb->spill_slot_defs = g_slist_prepend_mempool (cfg->mempool, bb->spill_slot_defs, ins);
5882 case OP_GC_SAFE_POINT: {
5885 g_assert (mono_threads_is_coop_enabled ());
5887 ARM_LDR_IMM (code, ARMREG_IP, ins->sreg1, 0);
5888 ARM_CMP_REG_IMM (code, ARMREG_IP, 0, 0);
5890 ARM_B_COND (code, ARMCOND_EQ, 0);
5891 mono_add_patch_info (cfg, code - cfg->native_code, MONO_PATCH_INFO_INTERNAL_METHOD, "mono_threads_state_poll");
5892 code = emit_call_seq (cfg, code);
5893 arm_patch (buf [0], code);
5898 g_warning ("unknown opcode %s in %s()\n", mono_inst_name (ins->opcode), __FUNCTION__);
5899 g_assert_not_reached ();
5902 if ((cfg->opt & MONO_OPT_BRANCH) && ((code - cfg->native_code - offset) > max_len)) {
5903 g_warning ("wrong maximal instruction length of instruction %s (expected %d, got %d)",
5904 mono_inst_name (ins->opcode), max_len, code - cfg->native_code - offset);
5905 g_assert_not_reached ();
5911 last_offset = offset;
5914 cfg->code_len = code - cfg->native_code;
5917 #endif /* DISABLE_JIT */
/*
 * mono_arch_register_lowlevel_calls:
 *
 *   Register the ARM specific helpers mono_arm_throw_exception,
 * mono_arm_throw_exception_by_token and mono_arm_unaligned_stack as JIT
 * icalls, each under a name identical to its C symbol.
 */
5920 mono_arch_register_lowlevel_calls (void)
5922 /* The signature doesn't matter */
/* All three helpers are therefore registered with the same placeholder "void" icall signature. */
5923 mono_register_jit_icall (mono_arm_throw_exception, "mono_arm_throw_exception", mono_create_icall_signature ("void"), TRUE);
5924 mono_register_jit_icall (mono_arm_throw_exception_by_token, "mono_arm_throw_exception_by_token", mono_create_icall_signature ("void"), TRUE);
/* This name is the one the prolog's stack alignment check uses in its MONO_PATCH_INFO_INTERNAL_METHOD patch. */
5925 mono_register_jit_icall (mono_arm_unaligned_stack, "mono_arm_unaligned_stack", mono_create_icall_signature ("void"), TRUE);
/*
 * patch_lis_ori:
 *
 *   Treat IP as an array of 16 bit values and store the upper 16 bits of VAL
 * into element 1 and the lower 16 bits of VAL into element 3. VAL is cast to
 * guint32 before being split.
 * NOTE(review): the uses in mono_arch_patch_code_new all follow a
 * g_assert_not_reached (), so this looks like unreachable leftover code; the
 * "lis + ori" naming presumably comes from another backend -- confirm.
 */
5928 #define patch_lis_ori(ip,val) do {\
5929 guint16 *__lis_ori = (guint16*)(ip); \
5930 __lis_ori [1] = (((guint32)(val)) >> 16) & 0xffff; \
5931 __lis_ori [3] = ((guint32)(val)) & 0xffff; \
/*
 * mono_arch_patch_code_new:
 *
 *   Apply the patch described by JI to the native code starting at CODE,
 * using TARGET as the resolved patch target. The patch site is
 * CODE + JI->ip.i.
 *
 * - MONO_PATCH_INFO_SWITCH: fill the jump table which is inlined 8 bytes after
 *   the patch site with CODE plus each entry of JI->data.table.
 * - MONO_PATCH_INFO_IP, METHOD_REL, the constant-like types (METHODCONST,
 *   CLASS, IMAGE, FIELD, VTABLE, IID, SFLDA, LDSTR, TYPE_FROM_HANDLE,
 *   LDTOKEN), R4/R8 and EXC_NAME: each group starts with
 *   g_assert_not_reached (), so the store following it is not expected to run.
 * - MONO_PATCH_INFO_NONE, BB_OVF, EXC_OVF: handled at epilog output time.
 * - The final statement forwards CFG, DOMAIN, the patch site and TARGET to
 *   arm_patch_general (); presumably this handles every remaining patch type
 *   (the label guarding it is not visible here -- TODO confirm).
 */
5935 mono_arch_patch_code_new (MonoCompile *cfg, MonoDomain *domain, guint8 *code, MonoJumpInfo *ji, gpointer target)
/* ip is the absolute address of the patch site: the code start plus the offset recorded in ji. */
5937 unsigned char *ip = ji->ip.i + code;
5939 if (ji->type == MONO_PATCH_INFO_SWITCH) {
5943 case MONO_PATCH_INFO_SWITCH: {
5944 gpointer *jt = (gpointer*)(ip + 8);
5946 /* jt is the inlined jump table, 2 instructions after ip
5947 * In the normal case we store the absolute addresses,
5948 * otherwise the displacements.
5950 for (i = 0; i < ji->data.table->table_size; i++)
5951 jt [i] = code + (int)ji->data.table->table [i];
5954 case MONO_PATCH_INFO_IP:
5955 g_assert_not_reached ();
5956 patch_lis_ori (ip, ip);
5958 case MONO_PATCH_INFO_METHOD_REL:
5959 g_assert_not_reached ();
5960 *((gpointer *)(ip)) = target;
5962 case MONO_PATCH_INFO_METHODCONST:
5963 case MONO_PATCH_INFO_CLASS:
5964 case MONO_PATCH_INFO_IMAGE:
5965 case MONO_PATCH_INFO_FIELD:
5966 case MONO_PATCH_INFO_VTABLE:
5967 case MONO_PATCH_INFO_IID:
5968 case MONO_PATCH_INFO_SFLDA:
5969 case MONO_PATCH_INFO_LDSTR:
5970 case MONO_PATCH_INFO_TYPE_FROM_HANDLE:
5971 case MONO_PATCH_INFO_LDTOKEN:
5972 g_assert_not_reached ();
5973 /* from OP_AOTCONST : lis + ori */
5974 patch_lis_ori (ip, target);
/* Floating point constant patches assert first, so the store below is not expected to execute. */
5976 case MONO_PATCH_INFO_R4:
5977 case MONO_PATCH_INFO_R8:
5978 g_assert_not_reached ();
5979 *((gconstpointer *)(ip + 2)) = target;
/* Exception name patches likewise assert before the store. */
5981 case MONO_PATCH_INFO_EXC_NAME:
5982 g_assert_not_reached ();
5983 *((gconstpointer *)(ip + 1)) = target;
/* These patch types need no work at this point. */
5985 case MONO_PATCH_INFO_NONE:
5986 case MONO_PATCH_INFO_BB_OVF:
5987 case MONO_PATCH_INFO_EXC_OVF:
5988 /* everything is dealt with at epilog output time */
/* Hand the patch site and target to the generic ARM patcher. NOTE(review): presumably the fallback for all other patch types -- confirm. */
5991 arm_patch_general (cfg, domain, ip, target);
/*
 * mono_arm_unaligned_stack:
 *
 *   Helper registered as the "mono_arm_unaligned_stack" JIT icall. The stack
 * alignment check sequence in mono_arch_emit_prolog emits a call to it which
 * is skipped when sp & (MONO_ARCH_FRAME_ALIGNMENT - 1) is zero, with r0 loaded
 * with the method being compiled (or 0 when compiling AOT).
 * METHOD is not used by the visible body; reaching this function is treated
 * as a fatal error.
 */
5997 mono_arm_unaligned_stack (MonoMethod *method)
5999 g_assert_not_reached ();
6005 * Stack frame layout:
6007 * ------------------- fp
6008 * MonoLMF structure or saved registers
6009 * -------------------
6011 * -------------------
6013 * -------------------
6014 * optional 8 bytes for tracing
6015 * -------------------
6016 * param area size is cfg->param_area
6017 * ------------------- sp
6020 mono_arch_emit_prolog (MonoCompile *cfg)
6022 MonoMethod *method = cfg->method;
6024 MonoMethodSignature *sig;
6026 int alloc_size, orig_alloc_size, pos, max_offset, i, rot_amount, part;
6031 int prev_sp_offset, reg_offset;
6033 if (mono_jit_trace_calls != NULL && mono_trace_eval (method))
6036 sig = mono_method_signature (method);
6037 cfg->code_size = 256 + sig->param_count * 64;
6038 code = cfg->native_code = g_malloc (cfg->code_size);
6040 mono_emit_unwind_op_def_cfa (cfg, code, ARMREG_SP, 0);
6042 alloc_size = cfg->stack_offset;
6048 * The iphone uses R7 as the frame pointer, and it points at the saved
6053 * We can't use r7 as a frame pointer since it points into the middle of
6054 * the frame, so we keep using our own frame pointer.
6055 * FIXME: Optimize this.
6057 ARM_PUSH (code, (1 << ARMREG_R7) | (1 << ARMREG_LR));
6058 prev_sp_offset += 8; /* r7 and lr */
6059 mono_emit_unwind_op_def_cfa_offset (cfg, code, prev_sp_offset);
6060 mono_emit_unwind_op_offset (cfg, code, ARMREG_R7, (- prev_sp_offset) + 0);
6061 ARM_MOV_REG_REG (code, ARMREG_R7, ARMREG_SP);
6064 if (!method->save_lmf) {
6066 /* No need to push LR again */
6067 if (cfg->used_int_regs)
6068 ARM_PUSH (code, cfg->used_int_regs);
6070 ARM_PUSH (code, cfg->used_int_regs | (1 << ARMREG_LR));
6071 prev_sp_offset += 4;
6073 for (i = 0; i < 16; ++i) {
6074 if (cfg->used_int_regs & (1 << i))
6075 prev_sp_offset += 4;
6077 mono_emit_unwind_op_def_cfa_offset (cfg, code, prev_sp_offset);
6079 for (i = 0; i < 16; ++i) {
6080 if ((cfg->used_int_regs & (1 << i))) {
6081 mono_emit_unwind_op_offset (cfg, code, i, (- prev_sp_offset) + reg_offset);
6082 mini_gc_set_slot_type_from_cfa (cfg, (- prev_sp_offset) + reg_offset, SLOT_NOREF);
6086 mono_emit_unwind_op_offset (cfg, code, ARMREG_LR, -4);
6087 mini_gc_set_slot_type_from_cfa (cfg, -4, SLOT_NOREF);
6089 ARM_MOV_REG_REG (code, ARMREG_IP, ARMREG_SP);
6090 ARM_PUSH (code, 0x5ff0);
6091 prev_sp_offset += 4 * 10; /* all but r0-r3, sp and pc */
6092 mono_emit_unwind_op_def_cfa_offset (cfg, code, prev_sp_offset);
6094 for (i = 0; i < 16; ++i) {
6095 if ((i > ARMREG_R3) && (i != ARMREG_SP) && (i != ARMREG_PC)) {
6096 /* The original r7 is saved at the start */
6097 if (!(iphone_abi && i == ARMREG_R7))
6098 mono_emit_unwind_op_offset (cfg, code, i, (- prev_sp_offset) + reg_offset);
6102 g_assert (reg_offset == 4 * 10);
6103 pos += sizeof (MonoLMF) - (4 * 10);
6107 orig_alloc_size = alloc_size;
6108 // align to MONO_ARCH_FRAME_ALIGNMENT bytes
6109 if (alloc_size & (MONO_ARCH_FRAME_ALIGNMENT - 1)) {
6110 alloc_size += MONO_ARCH_FRAME_ALIGNMENT - 1;
6111 alloc_size &= ~(MONO_ARCH_FRAME_ALIGNMENT - 1);
6114 /* the stack used in the pushed regs */
6115 alloc_size += ALIGN_TO (prev_sp_offset, MONO_ARCH_FRAME_ALIGNMENT) - prev_sp_offset;
6116 cfg->stack_usage = alloc_size;
6118 if ((i = mono_arm_is_rotated_imm8 (alloc_size, &rot_amount)) >= 0) {
6119 ARM_SUB_REG_IMM (code, ARMREG_SP, ARMREG_SP, i, rot_amount);
6121 code = mono_arm_emit_load_imm (code, ARMREG_IP, alloc_size);
6122 ARM_SUB_REG_REG (code, ARMREG_SP, ARMREG_SP, ARMREG_IP);
6124 mono_emit_unwind_op_def_cfa_offset (cfg, code, prev_sp_offset + alloc_size);
6126 if (cfg->frame_reg != ARMREG_SP) {
6127 ARM_MOV_REG_REG (code, cfg->frame_reg, ARMREG_SP);
6128 mono_emit_unwind_op_def_cfa_reg (cfg, code, cfg->frame_reg);
6130 //g_print ("prev_sp_offset: %d, alloc_size:%d\n", prev_sp_offset, alloc_size);
6131 prev_sp_offset += alloc_size;
6133 for (i = 0; i < alloc_size - orig_alloc_size; i += 4)
6134 mini_gc_set_slot_type_from_cfa (cfg, (- prev_sp_offset) + orig_alloc_size + i, SLOT_NOREF);
6136 /* Compute max_offset in order to use short forward jumps.
6137 * We could skip doing this on ARM because the immediate displacement
6138 * for jumps is large enough, but it may be useful later for constant pools.
6141 for (bb = cfg->bb_entry; bb; bb = bb->next_bb) {
6142 MonoInst *ins = bb->code;
6143 bb->max_offset = max_offset;
6145 if (cfg->prof_options & MONO_PROFILE_COVERAGE)
6148 MONO_BB_FOR_EACH_INS (bb, ins)
6149 max_offset += ((guint8 *)ins_get_spec (ins->opcode))[MONO_INST_LEN];
6152 /* stack alignment check */
6156 ARM_MOV_REG_REG (code, ARMREG_LR, ARMREG_SP);
6157 code = mono_arm_emit_load_imm (code, ARMREG_IP, MONO_ARCH_FRAME_ALIGNMENT -1);
6158 ARM_AND_REG_REG (code, ARMREG_LR, ARMREG_LR, ARMREG_IP);
6159 ARM_CMP_REG_IMM (code, ARMREG_LR, 0, 0);
6161 ARM_B_COND (code, ARMCOND_EQ, 0);
6162 if (cfg->compile_aot)
6163 ARM_MOV_REG_IMM8 (code, ARMREG_R0, 0);
6165 code = mono_arm_emit_load_imm (code, ARMREG_R0, (guint32)cfg->method);
6166 mono_add_patch_info (cfg, code - cfg->native_code, MONO_PATCH_INFO_INTERNAL_METHOD, "mono_arm_unaligned_stack");
6167 code = emit_call_seq (cfg, code);
6168 arm_patch (buf [0], code);
6172 /* store runtime generic context */
6173 if (cfg->rgctx_var) {
6174 MonoInst *ins = cfg->rgctx_var;
6176 g_assert (ins->opcode == OP_REGOFFSET);
6178 if (arm_is_imm12 (ins->inst_offset)) {
6179 ARM_STR_IMM (code, MONO_ARCH_RGCTX_REG, ins->inst_basereg, ins->inst_offset);
6181 code = mono_arm_emit_load_imm (code, ARMREG_LR, ins->inst_offset);
6182 ARM_STR_REG_REG (code, MONO_ARCH_RGCTX_REG, ins->inst_basereg, ARMREG_LR);
6186 /* load arguments allocated to register from the stack */
6189 cinfo = get_call_info (NULL, sig);
6191 if (cinfo->ret.storage == RegTypeStructByAddr) {
6192 ArgInfo *ainfo = &cinfo->ret;
6193 inst = cfg->vret_addr;
6194 g_assert (arm_is_imm12 (inst->inst_offset));
6195 ARM_STR_IMM (code, ainfo->reg, inst->inst_basereg, inst->inst_offset);
6198 if (sig->call_convention == MONO_CALL_VARARG) {
6199 ArgInfo *cookie = &cinfo->sig_cookie;
6201 /* Save the sig cookie address */
6202 g_assert (cookie->storage == RegTypeBase);
6204 g_assert (arm_is_imm12 (prev_sp_offset + cookie->offset));
6205 g_assert (arm_is_imm12 (cfg->sig_cookie));
6206 ARM_ADD_REG_IMM8 (code, ARMREG_IP, cfg->frame_reg, prev_sp_offset + cookie->offset);
6207 ARM_STR_IMM (code, ARMREG_IP, cfg->frame_reg, cfg->sig_cookie);
6210 for (i = 0; i < sig->param_count + sig->hasthis; ++i) {
6211 ArgInfo *ainfo = cinfo->args + i;
6212 inst = cfg->args [pos];
6214 if (cfg->verbose_level > 2)
6215 g_print ("Saving argument %d (type: %d)\n", i, ainfo->storage);
6217 if (inst->opcode == OP_REGVAR) {
6218 if (ainfo->storage == RegTypeGeneral)
6219 ARM_MOV_REG_REG (code, inst->dreg, ainfo->reg);
6220 else if (ainfo->storage == RegTypeFP) {
6221 g_assert_not_reached ();
6222 } else if (ainfo->storage == RegTypeBase) {
6223 if (arm_is_imm12 (prev_sp_offset + ainfo->offset)) {
6224 ARM_LDR_IMM (code, inst->dreg, ARMREG_SP, (prev_sp_offset + ainfo->offset));
6226 code = mono_arm_emit_load_imm (code, ARMREG_IP, prev_sp_offset + ainfo->offset);
6227 ARM_LDR_REG_REG (code, inst->dreg, ARMREG_SP, ARMREG_IP);
6230 g_assert_not_reached ();
6232 if (cfg->verbose_level > 2)
6233 g_print ("Argument %d assigned to register %s\n", pos, mono_arch_regname (inst->dreg));
6235 switch (ainfo->storage) {
6237 for (part = 0; part < ainfo->nregs; part ++) {
6238 if (ainfo->esize == 4)
6239 ARM_FSTS (code, ainfo->reg + part, inst->inst_basereg, inst->inst_offset + (part * ainfo->esize));
6241 ARM_FSTD (code, ainfo->reg + (part * 2), inst->inst_basereg, inst->inst_offset + (part * ainfo->esize));
6244 case RegTypeGeneral:
6245 case RegTypeIRegPair:
6246 case RegTypeGSharedVtInReg:
6247 case RegTypeStructByAddr:
6248 switch (ainfo->size) {
6250 if (arm_is_imm12 (inst->inst_offset))
6251 ARM_STRB_IMM (code, ainfo->reg, inst->inst_basereg, inst->inst_offset);
6253 code = mono_arm_emit_load_imm (code, ARMREG_IP, inst->inst_offset);
6254 ARM_STRB_REG_REG (code, ainfo->reg, inst->inst_basereg, ARMREG_IP);
6258 if (arm_is_imm8 (inst->inst_offset)) {
6259 ARM_STRH_IMM (code, ainfo->reg, inst->inst_basereg, inst->inst_offset);
6261 code = mono_arm_emit_load_imm (code, ARMREG_IP, inst->inst_offset);
6262 ARM_STRH_REG_REG (code, ainfo->reg, inst->inst_basereg, ARMREG_IP);
6266 if (arm_is_imm12 (inst->inst_offset)) {
6267 ARM_STR_IMM (code, ainfo->reg, inst->inst_basereg, inst->inst_offset);
6269 code = mono_arm_emit_load_imm (code, ARMREG_IP, inst->inst_offset);
6270 ARM_STR_REG_REG (code, ainfo->reg, inst->inst_basereg, ARMREG_IP);
6272 if (arm_is_imm12 (inst->inst_offset + 4)) {
6273 ARM_STR_IMM (code, ainfo->reg + 1, inst->inst_basereg, inst->inst_offset + 4);
6275 code = mono_arm_emit_load_imm (code, ARMREG_IP, inst->inst_offset + 4);
6276 ARM_STR_REG_REG (code, ainfo->reg + 1, inst->inst_basereg, ARMREG_IP);
6280 if (arm_is_imm12 (inst->inst_offset)) {
6281 ARM_STR_IMM (code, ainfo->reg, inst->inst_basereg, inst->inst_offset);
6283 code = mono_arm_emit_load_imm (code, ARMREG_IP, inst->inst_offset);
6284 ARM_STR_REG_REG (code, ainfo->reg, inst->inst_basereg, ARMREG_IP);
6289 case RegTypeBaseGen:
6290 if (arm_is_imm12 (prev_sp_offset + ainfo->offset)) {
6291 ARM_LDR_IMM (code, ARMREG_LR, ARMREG_SP, (prev_sp_offset + ainfo->offset));
6293 code = mono_arm_emit_load_imm (code, ARMREG_IP, prev_sp_offset + ainfo->offset);
6294 ARM_LDR_REG_REG (code, ARMREG_LR, ARMREG_SP, ARMREG_IP);
6296 if (arm_is_imm12 (inst->inst_offset + 4)) {
6297 ARM_STR_IMM (code, ARMREG_LR, inst->inst_basereg, inst->inst_offset + 4);
6298 ARM_STR_IMM (code, ARMREG_R3, inst->inst_basereg, inst->inst_offset);
6300 code = mono_arm_emit_load_imm (code, ARMREG_IP, inst->inst_offset + 4);
6301 ARM_STR_REG_REG (code, ARMREG_LR, inst->inst_basereg, ARMREG_IP);
6302 code = mono_arm_emit_load_imm (code, ARMREG_IP, inst->inst_offset);
6303 ARM_STR_REG_REG (code, ARMREG_R3, inst->inst_basereg, ARMREG_IP);
6307 case RegTypeGSharedVtOnStack:
6308 case RegTypeStructByAddrOnStack:
6309 if (arm_is_imm12 (prev_sp_offset + ainfo->offset)) {
6310 ARM_LDR_IMM (code, ARMREG_LR, ARMREG_SP, (prev_sp_offset + ainfo->offset));
6312 code = mono_arm_emit_load_imm (code, ARMREG_IP, prev_sp_offset + ainfo->offset);
6313 ARM_LDR_REG_REG (code, ARMREG_LR, ARMREG_SP, ARMREG_IP);
6316 switch (ainfo->size) {
6318 if (arm_is_imm8 (inst->inst_offset)) {
6319 ARM_STRB_IMM (code, ARMREG_LR, inst->inst_basereg, inst->inst_offset);
6321 code = mono_arm_emit_load_imm (code, ARMREG_IP, inst->inst_offset);
6322 ARM_STRB_REG_REG (code, ARMREG_LR, inst->inst_basereg, ARMREG_IP);
6326 if (arm_is_imm8 (inst->inst_offset)) {
6327 ARM_STRH_IMM (code, ARMREG_LR, inst->inst_basereg, inst->inst_offset);
6329 code = mono_arm_emit_load_imm (code, ARMREG_IP, inst->inst_offset);
6330 ARM_STRH_REG_REG (code, ARMREG_LR, inst->inst_basereg, ARMREG_IP);
6334 if (arm_is_imm12 (inst->inst_offset)) {
6335 ARM_STR_IMM (code, ARMREG_LR, inst->inst_basereg, inst->inst_offset);
6337 code = mono_arm_emit_load_imm (code, ARMREG_IP, inst->inst_offset);
6338 ARM_STR_REG_REG (code, ARMREG_LR, inst->inst_basereg, ARMREG_IP);
6340 if (arm_is_imm12 (prev_sp_offset + ainfo->offset + 4)) {
6341 ARM_LDR_IMM (code, ARMREG_LR, ARMREG_SP, (prev_sp_offset + ainfo->offset + 4));
6343 code = mono_arm_emit_load_imm (code, ARMREG_IP, prev_sp_offset + ainfo->offset + 4);
6344 ARM_LDR_REG_REG (code, ARMREG_LR, ARMREG_SP, ARMREG_IP);
6346 if (arm_is_imm12 (inst->inst_offset + 4)) {
6347 ARM_STR_IMM (code, ARMREG_LR, inst->inst_basereg, inst->inst_offset + 4);
6349 code = mono_arm_emit_load_imm (code, ARMREG_IP, inst->inst_offset + 4);
6350 ARM_STR_REG_REG (code, ARMREG_LR, inst->inst_basereg, ARMREG_IP);
6354 if (arm_is_imm12 (inst->inst_offset)) {
6355 ARM_STR_IMM (code, ARMREG_LR, inst->inst_basereg, inst->inst_offset);
6357 code = mono_arm_emit_load_imm (code, ARMREG_IP, inst->inst_offset);
6358 ARM_STR_REG_REG (code, ARMREG_LR, inst->inst_basereg, ARMREG_IP);
6364 int imm8, rot_amount;
6366 if ((imm8 = mono_arm_is_rotated_imm8 (inst->inst_offset, &rot_amount)) == -1) {
6367 code = mono_arm_emit_load_imm (code, ARMREG_IP, inst->inst_offset);
6368 ARM_ADD_REG_REG (code, ARMREG_IP, ARMREG_IP, inst->inst_basereg);
6370 ARM_ADD_REG_IMM (code, ARMREG_IP, inst->inst_basereg, imm8, rot_amount);
6372 if (ainfo->size == 8)
6373 ARM_FSTD (code, ainfo->reg, ARMREG_IP, 0);
6375 ARM_FSTS (code, ainfo->reg, ARMREG_IP, 0);
6378 case RegTypeStructByVal: {
6379 int doffset = inst->inst_offset;
6383 size = mini_type_stack_size_full (inst->inst_vtype, NULL, sig->pinvoke);
6384 for (cur_reg = 0; cur_reg < ainfo->size; ++cur_reg) {
6385 if (arm_is_imm12 (doffset)) {
6386 ARM_STR_IMM (code, ainfo->reg + cur_reg, inst->inst_basereg, doffset);
6388 code = mono_arm_emit_load_imm (code, ARMREG_IP, doffset);
6389 ARM_STR_REG_REG (code, ainfo->reg + cur_reg, inst->inst_basereg, ARMREG_IP);
6391 soffset += sizeof (gpointer);
6392 doffset += sizeof (gpointer);
6394 if (ainfo->vtsize) {
6395 /* FIXME: handle overrun! with struct sizes not multiple of 4 */
6396 //g_print ("emit_memcpy (prev_sp_ofs: %d, ainfo->offset: %d, soffset: %d)\n", prev_sp_offset, ainfo->offset, soffset);
6397 code = emit_memcpy (code, ainfo->vtsize * sizeof (gpointer), inst->inst_basereg, doffset, ARMREG_SP, prev_sp_offset + ainfo->offset);
6402 g_assert_not_reached ();
6409 if (method->save_lmf)
6410 code = emit_save_lmf (cfg, code, alloc_size - lmf_offset);
6413 code = mono_arch_instrument_prolog (cfg, mono_trace_enter_method, code, TRUE);
6415 if (cfg->arch.seq_point_info_var) {
6416 MonoInst *ins = cfg->arch.seq_point_info_var;
6418 /* Initialize the variable from a GOT slot */
6419 mono_add_patch_info (cfg, code - cfg->native_code, MONO_PATCH_INFO_SEQ_POINT_INFO, cfg->method);
6420 ARM_LDR_IMM (code, ARMREG_R0, ARMREG_PC, 0);
6422 *(gpointer*)code = NULL;
6424 ARM_LDR_REG_REG (code, ARMREG_R0, ARMREG_PC, ARMREG_R0);
6426 g_assert (ins->opcode == OP_REGOFFSET);
6428 if (arm_is_imm12 (ins->inst_offset)) {
6429 ARM_STR_IMM (code, ARMREG_R0, ins->inst_basereg, ins->inst_offset);
6431 code = mono_arm_emit_load_imm (code, ARMREG_LR, ins->inst_offset);
6432 ARM_STR_REG_REG (code, ARMREG_R0, ins->inst_basereg, ARMREG_LR);
6436 /* Initialize ss_trigger_page_var */
6437 if (!cfg->soft_breakpoints) {
6438 MonoInst *info_var = cfg->arch.seq_point_info_var;
6439 MonoInst *ss_trigger_page_var = cfg->arch.ss_trigger_page_var;
6440 int dreg = ARMREG_LR;
6443 g_assert (info_var->opcode == OP_REGOFFSET);
6444 g_assert (arm_is_imm12 (info_var->inst_offset));
6446 ARM_LDR_IMM (code, dreg, info_var->inst_basereg, info_var->inst_offset);
6447 /* Load the trigger page addr */
6448 ARM_LDR_IMM (code, dreg, dreg, MONO_STRUCT_OFFSET (SeqPointInfo, ss_trigger_page));
6449 ARM_STR_IMM (code, dreg, ss_trigger_page_var->inst_basereg, ss_trigger_page_var->inst_offset);
6453 if (cfg->arch.seq_point_ss_method_var) {
6454 MonoInst *ss_method_ins = cfg->arch.seq_point_ss_method_var;
6455 MonoInst *bp_method_ins = cfg->arch.seq_point_bp_method_var;
6457 g_assert (ss_method_ins->opcode == OP_REGOFFSET);
6458 g_assert (arm_is_imm12 (ss_method_ins->inst_offset));
6460 if (cfg->compile_aot) {
6461 MonoInst *info_var = cfg->arch.seq_point_info_var;
6462 int dreg = ARMREG_LR;
6464 g_assert (info_var->opcode == OP_REGOFFSET);
6465 g_assert (arm_is_imm12 (info_var->inst_offset));
6467 ARM_LDR_IMM (code, dreg, info_var->inst_basereg, info_var->inst_offset);
6468 ARM_LDR_IMM (code, dreg, dreg, MONO_STRUCT_OFFSET (SeqPointInfo, ss_tramp_addr));
6469 ARM_STR_IMM (code, dreg, ss_method_ins->inst_basereg, ss_method_ins->inst_offset);
6471 g_assert (bp_method_ins->opcode == OP_REGOFFSET);
6472 g_assert (arm_is_imm12 (bp_method_ins->inst_offset));
6474 ARM_MOV_REG_REG (code, ARMREG_LR, ARMREG_PC);
6476 *(gpointer*)code = &single_step_tramp;
6478 *(gpointer*)code = breakpoint_tramp;
6481 ARM_LDR_IMM (code, ARMREG_IP, ARMREG_LR, 0);
6482 ARM_STR_IMM (code, ARMREG_IP, ss_method_ins->inst_basereg, ss_method_ins->inst_offset);
6483 ARM_LDR_IMM (code, ARMREG_IP, ARMREG_LR, 4);
6484 ARM_STR_IMM (code, ARMREG_IP, bp_method_ins->inst_basereg, bp_method_ins->inst_offset);
6488 cfg->code_len = code - cfg->native_code;
6489 g_assert (cfg->code_len < cfg->code_size);
/*
 * mono_arch_emit_epilog:
 *
 *   Append the method epilog to cfg->native_code. The code buffer is grown
 * first if the budgeted epilog size does not fit. The epilog optionally emits
 * the trace-leave instrumentation, loads a vtype return value from cfg->ret
 * into registers, recomputes SP and pops the saved registers. The unwind
 * state is remembered before the epilog and restored after it, and
 * cfg->code_len is updated to the new end of code.
 */
6496 mono_arch_emit_epilog (MonoCompile *cfg)
6498 MonoMethod *method = cfg->method;
6499 int pos, i, rot_amount;
/* Baseline byte budget for the epilog; enlarged below for LMF restore and tracing. */
6500 int max_epilog_size = 16 + 20*4;
6504 if (cfg->method->save_lmf)
6505 max_epilog_size += 128;
6507 if (mono_jit_trace_calls != NULL)
6508 max_epilog_size += 50;
/* Double the code buffer until the budgeted epilog fits with 16 bytes to spare. */
6510 while (cfg->code_len + max_epilog_size > (cfg->code_size - 16)) {
6511 cfg->code_size *= 2;
6512 cfg->native_code = g_realloc (cfg->native_code, cfg->code_size);
6513 cfg->stat_code_reallocs++;
6517 * Keep in sync with OP_JMP
6519 code = cfg->native_code + cfg->code_len;
6521 /* Save the unwind state which is needed by the out-of-line code */
6522 mono_emit_unwind_op_remember_state (cfg, code);
6524 if (mono_jit_trace_calls != NULL && mono_trace_eval (method)) {
6525 code = mono_arch_instrument_epilog (cfg, mono_trace_leave_method, code, TRUE);
6529 /* Load returned vtypes into registers if needed */
6530 cinfo = cfg->arch.cinfo;
6531 switch (cinfo->ret.storage) {
6532 case RegTypeStructByVal: {
6533 MonoInst *ins = cfg->ret;
6535 if (cinfo->ret.nregs == 1) {
/* LR is used as the scratch register when the offset does not fit a 12-bit immediate. */
6536 if (arm_is_imm12 (ins->inst_offset)) {
6537 ARM_LDR_IMM (code, ARMREG_R0, ins->inst_basereg, ins->inst_offset);
6539 code = mono_arm_emit_load_imm (code, ARMREG_LR, ins->inst_offset);
6540 ARM_LDR_REG_REG (code, ARMREG_R0, ins->inst_basereg, ARMREG_LR);
/* Multi-register case: word i of the value is loaded into register number i. */
6543 for (i = 0; i < cinfo->ret.nregs; ++i) {
6544 int offset = ins->inst_offset + (i * 4);
6545 if (arm_is_imm12 (offset)) {
6546 ARM_LDR_IMM (code, i, ins->inst_basereg, offset);
6548 code = mono_arm_emit_load_imm (code, ARMREG_LR, offset);
6549 ARM_LDR_REG_REG (code, i, ins->inst_basereg, ARMREG_LR);
6556 MonoInst *ins = cfg->ret;
/* Floating point elements: single-precision loads when esize is 4, double-precision loads otherwise. */
6558 for (i = 0; i < cinfo->ret.nregs; ++i) {
6559 if (cinfo->ret.esize == 4)
6560 ARM_FLDS (code, cinfo->ret.reg + i, ins->inst_basereg, ins->inst_offset + (i * cinfo->ret.esize));
6562 ARM_FLDD (code, cinfo->ret.reg + (i * 2), ins->inst_basereg, ins->inst_offset + (i * cinfo->ret.esize));
/* LMF path: restore the LMF, point SP into MonoLMF->iregs and pop the saved registers from there. */
6570 if (method->save_lmf) {
6571 int lmf_offset, reg, sp_adj, regmask, nused_int_regs = 0;
6572 /* all but r0-r3, sp and pc */
6573 pos += sizeof (MonoLMF) - (MONO_ARM_NUM_SAVED_REGS * sizeof (mgreg_t));
6576 code = emit_restore_lmf (cfg, code, cfg->stack_usage - lmf_offset);
6578 /* This points to r4 inside MonoLMF->iregs */
6579 sp_adj = (sizeof (MonoLMF) - MONO_ARM_NUM_SAVED_REGS * sizeof (mgreg_t));
6581 regmask = 0x9ff0; /* restore lr to pc */
6582 /* Skip caller saved registers not used by the method */
6583 while (!(cfg->used_int_regs & (1 << reg)) && reg < ARMREG_FP) {
6584 regmask &= ~(1 << reg);
6589 /* Restored later */
6590 regmask &= ~(1 << ARMREG_PC);
6591 /* point sp at the registers to restore: 10 is 14 -4, because we skip r0-r3 */
6592 code = emit_big_add (code, ARMREG_SP, cfg->frame_reg, cfg->stack_usage - lmf_offset + sp_adj);
6593 for (i = 0; i < 16; i++) {
6594 if (regmask & (1 << i))
6597 mono_emit_unwind_op_def_cfa (cfg, code, ARMREG_SP, ((iphone_abi ? 3 : 0) + nused_int_regs) * 4);
6599 ARM_POP (code, regmask);
6601 for (i = 0; i < 16; i++) {
6602 if (regmask & (1 << i))
6603 mono_emit_unwind_op_same_value (cfg, code, i);
6605 /* Restore saved r7, restore LR to PC */
6606 /* Skip lr from the lmf */
6607 mono_emit_unwind_op_def_cfa_offset (cfg, code, 3 * 4);
6608 ARM_ADD_REG_IMM (code, ARMREG_SP, ARMREG_SP, sizeof (gpointer), 0);
6609 mono_emit_unwind_op_def_cfa_offset (cfg, code, 2 * 4);
6610 ARM_POP (code, (1 << ARMREG_R7) | (1 << ARMREG_PC));
/* Non-LMF path: SP is recomputed as frame_reg + stack_usage, then the registers in used_int_regs are popped. */
6613 int i, nused_int_regs = 0;
6615 for (i = 0; i < 16; i++) {
6616 if (cfg->used_int_regs & (1 << i))
/* Use an ADD with a rotated 8-bit immediate when stack_usage can be encoded that way, otherwise go through IP. */
6620 if ((i = mono_arm_is_rotated_imm8 (cfg->stack_usage, &rot_amount)) >= 0) {
6621 ARM_ADD_REG_IMM (code, ARMREG_SP, cfg->frame_reg, i, rot_amount);
6623 code = mono_arm_emit_load_imm (code, ARMREG_IP, cfg->stack_usage);
6624 ARM_ADD_REG_REG (code, ARMREG_SP, cfg->frame_reg, ARMREG_IP);
6627 if (cfg->frame_reg != ARMREG_SP) {
6628 mono_emit_unwind_op_def_cfa_reg (cfg, code, ARMREG_SP);
6632 /* Restore saved gregs */
6633 if (cfg->used_int_regs) {
6634 mono_emit_unwind_op_def_cfa_offset (cfg, code, (2 + nused_int_regs) * 4);
6635 ARM_POP (code, cfg->used_int_regs);
6636 for (i = 0; i < 16; i++) {
6637 if (cfg->used_int_regs & (1 << i))
6638 mono_emit_unwind_op_same_value (cfg, code, i);
6641 mono_emit_unwind_op_def_cfa_offset (cfg, code, 2 * 4);
6642 /* Restore saved r7, restore LR to PC */
6643 ARM_POP (code, (1 << ARMREG_R7) | (1 << ARMREG_PC));
6645 mono_emit_unwind_op_def_cfa_offset (cfg, code, (nused_int_regs + 1) * 4);
6646 ARM_POP (code, cfg->used_int_regs | (1 << ARMREG_PC));
6650 /* Restore the unwind state to be the same as before the epilog */
6651 mono_emit_unwind_op_restore_state (cfg, code);
6653 cfg->code_len = code - cfg->native_code;
/* Sanity check that the emitted epilog stayed inside the buffer. */
6655 g_assert (cfg->code_len < cfg->code_size);
/*
 * mono_arch_emit_exceptions:
 *
 *   Emit the out-of-line exception throwing sequences at the end of the
 * method. Every MONO_PATCH_INFO_EXC patch is resolved to a throw sequence;
 * only one sequence is emitted per exception id, and later patches with the
 * same id are patched to branch to the first one and downgraded to
 * MONO_PATCH_INFO_NONE. The patch entry of the first one is reused as a
 * MONO_PATCH_INFO_INTERNAL_METHOD patch for mono_arch_throw_corlib_exception.
 */
6660 mono_arch_emit_exceptions (MonoCompile *cfg)
6662 MonoJumpInfo *patch_info;
/* Per exception id: where its throw sequence was emitted, and whether it was already budgeted for. */
6665 guint8* exc_throw_pos [MONO_EXC_INTRINS_NUM];
6666 guint8 exc_throw_found [MONO_EXC_INTRINS_NUM];
6667 int max_epilog_size = 50;
6669 for (i = 0; i < MONO_EXC_INTRINS_NUM; i++) {
6670 exc_throw_pos [i] = NULL;
6671 exc_throw_found [i] = 0;
6674 /* count the number of exception infos */
6677 * make sure we have enough space for exceptions
/* Budget 32 bytes for each distinct exception id referenced by the method. */
/* NOTE(review): the id returned by mini_exception_id_by_name () indexes both arrays with no visible range check - confirm it is always below MONO_EXC_INTRINS_NUM. */
6679 for (patch_info = cfg->patch_info; patch_info; patch_info = patch_info->next) {
6680 if (patch_info->type == MONO_PATCH_INFO_EXC) {
6681 i = mini_exception_id_by_name (patch_info->data.target);
6682 if (!exc_throw_found [i]) {
6683 max_epilog_size += 32;
6684 exc_throw_found [i] = TRUE;
/* Double the code buffer until the budgeted size fits with 16 bytes to spare. */
6689 while (cfg->code_len + max_epilog_size > (cfg->code_size - 16)) {
6690 cfg->code_size *= 2;
6691 cfg->native_code = g_realloc (cfg->native_code, cfg->code_size);
6692 cfg->stat_code_reallocs++;
6695 code = cfg->native_code + cfg->code_len;
6697 /* add code to raise exceptions */
6698 for (patch_info = cfg->patch_info; patch_info; patch_info = patch_info->next) {
6699 switch (patch_info->type) {
6700 case MONO_PATCH_INFO_EXC: {
6701 MonoClass *exc_class;
6702 unsigned char *ip = patch_info->ip.i + cfg->native_code;
6704 i = mini_exception_id_by_name (patch_info->data.target);
/* A sequence for this id already exists: redirect the branch at ip to it and retire the patch. */
6705 if (exc_throw_pos [i]) {
6706 arm_patch (ip, exc_throw_pos [i]);
6707 patch_info->type = MONO_PATCH_INFO_NONE;
6710 exc_throw_pos [i] = code;
6712 arm_patch (ip, code);
6714 exc_class = mono_class_load_from_name (mono_defaults.corlib, "System", patch_info->data.name);
/* R1 receives LR; R0 is loaded PC-relative from the token word written below. */
6716 ARM_MOV_REG_REG (code, ARMREG_R1, ARMREG_LR);
6717 ARM_LDR_IMM (code, ARMREG_R0, ARMREG_PC, 0);
6718 patch_info->type = MONO_PATCH_INFO_INTERNAL_METHOD;
6719 patch_info->data.name = "mono_arch_throw_corlib_exception";
6720 patch_info->ip.i = code - cfg->native_code;
6722 cfg->thunk_area += THUNK_SIZE;
/* The exception class is passed as its type token with the MONO_TOKEN_TYPE_DEF part subtracted. */
6723 *(guint32*)(gpointer)code = exc_class->type_token - MONO_TOKEN_TYPE_DEF;
6733 cfg->code_len = code - cfg->native_code;
6735 g_assert (cfg->code_len < cfg->code_size);
6739 #endif /* #ifndef DISABLE_JIT */
/* Architecture hook taking no arguments. NOTE(review): confirm what, if anything, needs late initialization on ARM. */
6742 mono_arch_finish_init (void)
/* Architecture hook receiving the per-thread JIT data. NOTE(review): presumably releases arch specific state stored in TLS - confirm whether ARM keeps any. */
6747 mono_arch_free_jit_tls_data (MonoJitTlsData *tls)
/* Architecture hook given the compile context, the called method, its signature and the argument instructions. NOTE(review): presumably lets the backend replace the call with an intrinsic - confirm against the caller. */
6752 mono_arch_emit_inst_for_method (MonoCompile *cfg, MonoMethod *cmethod, MonoMethodSignature *fsig, MonoInst **args)
/* Architecture hook for printing an instruction tree of the given arity. NOTE(review): the return value convention should be confirmed against the generic printer. */
6759 mono_arch_print_tree (MonoInst *tree, int arity)
/* Architecture hook taking a pointer into native code. NOTE(review): presumably returns the offset of the patchable word relative to CODE - confirm. */
6769 mono_arch_get_patch_offset (guint8 *code)
/* Architecture hook taking no arguments. NOTE(review): presumably a no-op on ARM, which has no register windows - confirm. */
6776 mono_arch_flush_register_windows (void)
/*
 * Return the IMT method for a call, read from the saved register array REGS
 * at index MONO_ARCH_IMT_REG. CODE is not used by the return expression.
 */
6781 mono_arch_find_imt_method (mgreg_t *regs, guint8 *code)
6783 return (MonoMethod*)regs [MONO_ARCH_IMT_REG];
/*
 * Return the vtable for a static call, read from the saved register array
 * REGS at index MONO_ARCH_RGCTX_REG. CODE is not used by the return expression.
 */
6787 mono_arch_find_static_call_vtable (mgreg_t *regs, guint8 *code)
6789 return (MonoVTable*) regs [MONO_ARCH_RGCTX_REG];
/*
 * Build the initial unwind program: a single op defining the CFA as SP with
 * offset 0, recorded with NULL code pointers.
 */
6793 mono_arch_get_cie_program (void)
6797 mono_add_unwind_op_def_cfa (l, (guint8*)NULL, (guint8*)NULL, ARMREG_SP, 0);
6802 /* #define ENABLE_WRONG_METHOD_CHECK 1 */
/*
 * Size budgets used when sizing IMT trampolines, each written as a word
 * count times 4. NOTE(review): presumably bytes, with 4 being the size of
 * one ARM instruction - confirm.
 */
6803 #define BASE_SIZE (6 * 4)
/* Budget added to chunk_size for an entry that is not an equality check. */
6804 #define BSEARCH_ENTRY_SIZE (4 * 4)
/* Budget for the load + compare of an IMT key. */
6805 #define CMP_SIZE (3 * 4)
6806 #define BRANCH_SIZE (1 * 4)
6807 #define CALL_SIZE (2 * 4)
/* Budget for the optional wrong-method check (ENABLE_WRONG_METHOD_CHECK). */
6808 #define WMC_SIZE (8 * 4)
/* Signed 32-bit difference B - A, after converting both operands to gint32. */
6809 #define DISTANCE(A, B) (((gint32)(B)) - ((gint32)(A)))
/*
 * Patch the load instruction at TARGET so that its immediate offset field
 * refers to the position CODE: the distance from TARGET to CODE is OR-ed
 * into the instruction word after being checked against the 12-bit range
 * 0..0xFFF.
 */
6812 arm_emit_value_and_patch_ldr (arminstr_t *code, arminstr_t *target, guint32 value)
6814 guint32 delta = DISTANCE (target, code);
/* NOTE(review): delta is a guint32, so `delta >= 0` is always true; a negative distance wraps to a large value and is caught by the upper bound only. */
6816 g_assert (delta >= 0 && delta <= 0xFFF);
6817 *target = *target | delta;
6822 #ifdef ENABLE_WRONG_METHOD_CHECK
/*
 * Debug helper for ENABLE_WRONG_METHOD_CHECK builds: print the IMT value
 * received, the value it was compared against, and the ip, all in hex.
 */
6824 mini_dump_bad_imt (int input_imt, int compared_imt, int pc)
/* NOTE(review): the message has no trailing newline - confirm this is intended. */
6826 g_print ("BAD IMT comparing %x with expected %x at ip %x", input_imt, compared_imt, pc);
/*
 * mono_arch_build_imt_trampoline:
 *
 *   Build the IMT trampoline for VTABLE from the COUNT check items in
 * IMT_ENTRIES. The work is done in three passes: size every entry, emit the
 * compare/branch/dispatch code for every entry, then resolve the recorded
 * branches and fill in the constants for the non-equality entries. The
 * finished code is flushed from the icache, reported to the profiler and
 * registered as a trampoline with its unwind ops. When FAIL_TRAMP is given,
 * a failed equality check with no further target dispatches to it.
 */
6832 mono_arch_build_imt_trampoline (MonoVTable *vtable, MonoDomain *domain, MonoIMTCheckItem **imt_entries, int count,
6833 gpointer fail_tramp)
6836 arminstr_t *code, *start;
/* Set when any entry needs the 4-slot stack frame (target code, or a vtable offset that does not fit imm12). */
6837 gboolean large_offsets = FALSE;
6838 guint32 **constant_pool_starts;
6839 arminstr_t *vtable_target = NULL;
6840 int extra_space = 0;
6841 #ifdef ENABLE_WRONG_METHOD_CHECK
6847 constant_pool_starts = g_new0 (guint32*, count);
/* Pass 1: accumulate item->chunk_size for every entry and the total size. */
6849 for (i = 0; i < count; ++i) {
6850 MonoIMTCheckItem *item = imt_entries [i];
6851 if (item->is_equals) {
6852 gboolean fail_case = !item->check_target_idx && fail_tramp;
6854 if (item->has_target_code || !arm_is_imm12 (DISTANCE (vtable, &vtable->vtable[item->value.vtable_slot]))) {
6855 item->chunk_size += 32;
6856 large_offsets = TRUE;
6859 if (item->check_target_idx || fail_case) {
6860 if (!item->compare_done || fail_case)
6861 item->chunk_size += CMP_SIZE;
6862 item->chunk_size += BRANCH_SIZE;
6864 #ifdef ENABLE_WRONG_METHOD_CHECK
6865 item->chunk_size += WMC_SIZE;
6869 item->chunk_size += 16;
6870 large_offsets = TRUE;
6872 item->chunk_size += CALL_SIZE;
6874 item->chunk_size += BSEARCH_ENTRY_SIZE;
6875 imt_entries [item->check_target_idx]->compare_done = TRUE;
6877 size += item->chunk_size;
6881 size += 4 * count; /* The ARM_ADD_REG_IMM to pop the stack */
6884 code = mono_method_alloc_generic_virtual_trampoline (domain, size);
6886 code = mono_domain_code_reserve (domain, size);
6889 unwind_ops = mono_arch_get_cie_program ();
6892 g_print ("Building IMT trampoline for class %s %s entries %d code size %d code at %p end %p vtable %p fail_tramp %p\n", vtable->klass->name_space, vtable->klass->name, count, size, start, ((guint8*)start) + size, vtable, fail_tramp);
6893 for (i = 0; i < count; ++i) {
6894 MonoIMTCheckItem *item = imt_entries [i];
6895 g_print ("method %d (%p) %s vtable slot %p is_equals %d chunk size %d\n", i, item->key, ((MonoMethod*)item->key)->name, &vtable->vtable [item->value.vtable_slot], item->is_equals, item->chunk_size);
/* Entry sequence: push the scratch registers; the large-offset form reserves a fourth slot that later receives the branch target. */
6899 if (large_offsets) {
6900 ARM_PUSH4 (code, ARMREG_R0, ARMREG_R1, ARMREG_IP, ARMREG_PC);
6901 mono_add_unwind_op_def_cfa_offset (unwind_ops, code, start, 4 * sizeof (mgreg_t));
6903 ARM_PUSH2 (code, ARMREG_R0, ARMREG_R1);
6904 mono_add_unwind_op_def_cfa_offset (unwind_ops, code, start, 2 * sizeof (mgreg_t));
6906 ARM_LDR_IMM (code, ARMREG_R0, ARMREG_LR, -4);
/* Remember the load of the vtable address into IP; its constant is emitted later, after the first unconditional branch. */
6907 vtable_target = code;
6908 ARM_LDR_IMM (code, ARMREG_IP, ARMREG_PC, 0);
6909 ARM_MOV_REG_REG (code, ARMREG_R0, ARMREG_V5);
/* Pass 2: emit the code for every entry, recording code_target and jmp_code for later patching. */
6911 for (i = 0; i < count; ++i) {
6912 MonoIMTCheckItem *item = imt_entries [i];
6913 arminstr_t *imt_method = NULL, *vtable_offset_ins = NULL, *target_code_ins = NULL;
6914 gint32 vtable_offset;
6916 item->code_target = (guint8*)code;
6918 if (item->is_equals) {
6919 gboolean fail_case = !item->check_target_idx && fail_tramp;
6921 if (item->check_target_idx || fail_case) {
6922 if (!item->compare_done || fail_case) {
6924 ARM_LDR_IMM (code, ARMREG_R1, ARMREG_PC, 0);
6925 ARM_CMP_REG_REG (code, ARMREG_R0, ARMREG_R1);
6927 item->jmp_code = (guint8*)code;
6928 ARM_B_COND (code, ARMCOND_NE, 0);
6930 /*Enable the commented code to assert on wrong method*/
6931 #ifdef ENABLE_WRONG_METHOD_CHECK
6933 ARM_LDR_IMM (code, ARMREG_R1, ARMREG_PC, 0);
6934 ARM_CMP_REG_REG (code, ARMREG_R0, ARMREG_R1);
6936 ARM_B_COND (code, ARMCOND_EQ, 0);
6938 /* Define this if your system is so bad that gdb is failing. */
6939 #ifdef BROKEN_DEV_ENV
6940 ARM_MOV_REG_REG (code, ARMREG_R2, ARMREG_PC);
6942 arm_patch (code - 1, mini_dump_bad_imt);
6946 arm_patch (cond, code);
6950 if (item->has_target_code) {
6951 /* Load target address */
6952 target_code_ins = code;
6953 ARM_LDR_IMM (code, ARMREG_R1, ARMREG_PC, 0);
6954 /* Save it to the fourth slot */
6955 ARM_STR_IMM (code, ARMREG_R1, ARMREG_SP, 3 * sizeof (gpointer));
6956 /* Restore registers and branch */
6957 ARM_POP4 (code, ARMREG_R0, ARMREG_R1, ARMREG_IP, ARMREG_PC);
6959 code = arm_emit_value_and_patch_ldr (code, target_code_ins, (gsize)item->value.target_code);
6961 vtable_offset = DISTANCE (vtable, &vtable->vtable[item->value.vtable_slot]);
6962 if (!arm_is_imm12 (vtable_offset)) {
6964 * We need to branch to a computed address but we don't have
6965 * a free register to store it, since IP must contain the
6966 * vtable address. So we push the two values to the stack, and
6967 * load them both using LDM.
6969 /* Compute target address */
6970 vtable_offset_ins = code;
6971 ARM_LDR_IMM (code, ARMREG_R1, ARMREG_PC, 0);
6972 ARM_LDR_REG_REG (code, ARMREG_R1, ARMREG_IP, ARMREG_R1);
6973 /* Save it to the fourth slot */
6974 ARM_STR_IMM (code, ARMREG_R1, ARMREG_SP, 3 * sizeof (gpointer));
6975 /* Restore registers and branch */
6976 ARM_POP4 (code, ARMREG_R0, ARMREG_R1, ARMREG_IP, ARMREG_PC);
6978 code = arm_emit_value_and_patch_ldr (code, vtable_offset_ins, vtable_offset);
/* Small offset: pop R0/R1, drop the two extra slots if the large frame was pushed, and load PC straight from the vtable slot. */
6980 ARM_POP2 (code, ARMREG_R0, ARMREG_R1);
6981 if (large_offsets) {
6982 mono_add_unwind_op_def_cfa_offset (unwind_ops, code, start, 2 * sizeof (mgreg_t));
6983 ARM_ADD_REG_IMM8 (code, ARMREG_SP, ARMREG_SP, 2 * sizeof (gpointer));
6985 mono_add_unwind_op_def_cfa_offset (unwind_ops, code, start, 0);
6986 ARM_LDR_IMM (code, ARMREG_PC, ARMREG_IP, vtable_offset);
/* Fail case: the not-equal branch lands here and dispatches to fail_tramp through the fourth stack slot. */
6991 arm_patch (item->jmp_code, (guchar*)code);
6993 target_code_ins = code;
6994 /* Load target address */
6995 ARM_LDR_IMM (code, ARMREG_R1, ARMREG_PC, 0);
6996 /* Save it to the fourth slot */
6997 ARM_STR_IMM (code, ARMREG_R1, ARMREG_SP, 3 * sizeof (gpointer));
6998 /* Restore registers and branch */
6999 ARM_POP4 (code, ARMREG_R0, ARMREG_R1, ARMREG_IP, ARMREG_PC);
7001 code = arm_emit_value_and_patch_ldr (code, target_code_ins, (gsize)fail_tramp);
7002 item->jmp_code = NULL;
7006 code = arm_emit_value_and_patch_ldr (code, imt_method, (guint32)item->key);
7008 /*must emit after unconditional branch*/
7009 if (vtable_target) {
7010 code = arm_emit_value_and_patch_ldr (code, vtable_target, (guint32)vtable);
7011 item->chunk_size += 4;
7012 vtable_target = NULL;
7015 /*We reserve the space for bsearch IMT values after the first entry with an absolute jump*/
7016 constant_pool_starts [i] = code;
7018 code += extra_space;
/* Non-equality entry: compare against a key loaded PC-relative and branch on unsigned higher-or-same. */
7022 ARM_LDR_IMM (code, ARMREG_R1, ARMREG_PC, 0);
7023 ARM_CMP_REG_REG (code, ARMREG_R0, ARMREG_R1);
7025 item->jmp_code = (guint8*)code;
7026 ARM_B_COND (code, ARMCOND_HS, 0);
/* Pass 3: point every recorded branch at its target entry and write the keys of the preceding non-equality entries into the reserved constant space. */
7031 for (i = 0; i < count; ++i) {
7032 MonoIMTCheckItem *item = imt_entries [i];
7033 if (item->jmp_code) {
7034 if (item->check_target_idx)
7035 arm_patch (item->jmp_code, imt_entries [item->check_target_idx]->code_target);
7037 if (i > 0 && item->is_equals) {
7039 arminstr_t *space_start = constant_pool_starts [i];
7040 for (j = i - 1; j >= 0 && !imt_entries [j]->is_equals; --j) {
7041 space_start = arm_emit_value_and_patch_ldr (space_start, (arminstr_t*)imt_entries [j]->code_target, (guint32)imt_entries [j]->key);
7048 char *buff = g_strdup_printf ("thunk_for_class_%s_%s_entries_%d", vtable->klass->name_space, vtable->klass->name, count);
7049 mono_disassemble_code (NULL, (guint8*)start, size, buff);
7054 g_free (constant_pool_starts);
7056 mono_arch_flush_icache ((guint8*)start, size);
7057 mono_profiler_code_buffer_new (start, code - start, MONO_PROFILER_CODE_BUFFER_IMT_TRAMPOLINE, NULL);
7058 mono_stats.imt_trampolines_size += code - start;
/* The emitted code must not exceed the size computed in pass 1. */
7060 g_assert (DISTANCE (start, code) <= size);
7062 mono_tramp_info_register (mono_tramp_info_create (NULL, (guint8*)start, DISTANCE (start, code), NULL, unwind_ops), domain);
/* Return the value of integer register REG stored in CTX. REG is used as an index into ctx->regs without a range check. */
7068 mono_arch_context_get_int_reg (MonoContext *ctx, int reg)
7070 return ctx->regs [reg];
/* Store VAL as the value of integer register REG in CTX. REG is used as an index into ctx->regs without a range check. */
7074 mono_arch_context_set_int_reg (MonoContext *ctx, int reg, mgreg_t val)
7076 ctx->regs [reg] = val;
7080 * mono_arch_get_trampolines:
7082 * Return a list of MonoTrampInfo structures describing arch specific trampolines
/* Forwards to mono_arm_get_exception_trampolines (), passing AOT through unchanged. */
7086 mono_arch_get_trampolines (gboolean aot)
7088 return mono_arm_get_exception_trampolines (aot);
/*
 * Replace the pointer stored in the frame at BP + clause->exvar_offset with
 * NEW_VALUE, where BP is taken from CTX. The previous value is first
 * compared against the code range of JI.
 */
7092 mono_arch_install_handler_block_guard (MonoJitInfo *ji, MonoJitExceptionInfo *clause, MonoContext *ctx, gpointer new_value)
7099 bp = MONO_CONTEXT_GET_BP (ctx);
7100 lr_loc = (gpointer*)(bp + clause->exvar_offset);
7102 old_value = *lr_loc;
/* True when the stored value lies outside [code_start, code_start + code_size]; note the upper bound is inclusive. */
7103 if ((char*)old_value < (char*)ji->code_start || (char*)old_value > ((char*)ji->code_start + ji->code_size))
7106 *lr_loc = new_value;
7111 #if defined(MONO_ARCH_SOFT_DEBUG_SUPPORTED)
7113 * mono_arch_set_breakpoint:
7115 * Set a breakpoint at the native code corresponding to JI at NATIVE_OFFSET.
7116 * The location should contain code emitted by OP_SEQ_POINT.
/*
 * Three ways of arming a breakpoint are visible below:
 *  - table based: the SeqPointInfo slot for IP (bp_addrs [native_offset / 4])
 *    is set to breakpoint_tramp when soft breakpoints are enabled, and to
 *    bp_trigger_page otherwise; the slot must have been 0;
 *  - soft breakpoints: a BLX through LR is written and the icache flushed;
 *  - otherwise: code is written which loads the address of bp_trigger_page
 *    from an inline word and then reads from that address.
 * A further variant writes an SWI instruction word directly.
 */
7119 mono_arch_set_breakpoint (MonoJitInfo *ji, guint8 *ip)
7122 guint32 native_offset = ip - (guint8*)ji->code_start;
7123 MonoDebugOptions *opt = mini_get_debug_options ();
7126 SeqPointInfo *info = mono_arch_get_seq_point_info (mono_domain_get (), ji->code_start);
7128 if (!breakpoint_tramp)
7129 breakpoint_tramp = mini_get_breakpoint_trampoline ();
7131 g_assert (native_offset % 4 == 0);
7132 g_assert (info->bp_addrs [native_offset / 4] == 0);
7133 info->bp_addrs [native_offset / 4] = opt->soft_breakpoints ? breakpoint_tramp : bp_trigger_page;
7134 } else if (opt->soft_breakpoints) {
7136 ARM_BLX_REG (code, ARMREG_LR);
7137 mono_arch_flush_icache (code - 4, 4);
7139 int dreg = ARMREG_LR;
7141 /* Read from another trigger page */
7142 ARM_LDR_IMM (code, dreg, ARMREG_PC, 0);
7144 *(int*)code = (int)bp_trigger_page;
7146 ARM_LDR_IMM (code, dreg, dreg, 0);
7148 mono_arch_flush_icache (code - 16, 16);
7151 /* This is currently implemented by emitting an SWI instruction, which
7152 * qemu/linux seems to convert to a SIGILL.
7154 *(int*)code = (0xef << 24) | 8;
7156 mono_arch_flush_icache (code - 4, 4);
7162 * mono_arch_clear_breakpoint:
7164 * Clear the breakpoint at IP.
/*
 * Counterpart of mono_arch_set_breakpoint (). In the table based variant the
 * SeqPointInfo slot for IP must hold the value that arming stored there
 * (breakpoint_tramp for soft breakpoints, bp_trigger_page otherwise) and is
 * reset to 0. The other variants rewrite the code at IP and flush the icache.
 */
7167 mono_arch_clear_breakpoint (MonoJitInfo *ji, guint8 *ip)
7169 MonoDebugOptions *opt = mini_get_debug_options ();
7174 guint32 native_offset = ip - (guint8*)ji->code_start;
7175 SeqPointInfo *info = mono_arch_get_seq_point_info (mono_domain_get (), ji->code_start);
7177 if (!breakpoint_tramp)
7178 breakpoint_tramp = mini_get_breakpoint_trampoline ();
7180 g_assert (native_offset % 4 == 0);
/* Clearing a slot that was not armed with the expected value is treated as a fatal error. */
7181 g_assert (info->bp_addrs [native_offset / 4] == (opt->soft_breakpoints ? breakpoint_tramp : bp_trigger_page));
7182 info->bp_addrs [native_offset / 4] = 0;
7183 } else if (opt->soft_breakpoints) {
7186 mono_arch_flush_icache (code - 4, 4);
7188 for (i = 0; i < 4; ++i)
7191 mono_arch_flush_icache (ip, code - ip);
7196 * mono_arch_start_single_stepping:
7198 * Start single stepping.
/*
 * Enable single stepping: if a single step trigger page exists, remove all
 * access to it (protection 0); single_step_tramp is set to the single step
 * trampoline.
 */
7201 mono_arch_start_single_stepping (void)
7203 if (ss_trigger_page)
7204 mono_mprotect (ss_trigger_page, mono_pagesize (), 0);
7206 single_step_tramp = mini_get_single_step_trampoline ();
7210 * mono_arch_stop_single_stepping:
7212 * Stop single stepping.
/*
 * Disable single stepping: if a single step trigger page exists, make it
 * readable again; single_step_tramp is reset to NULL.
 */
7215 mono_arch_stop_single_stepping (void)
7217 if (ss_trigger_page)
7218 mono_mprotect (ss_trigger_page, mono_pagesize (), MONO_MMAP_READ);
7220 single_step_tramp = NULL;
/* Signal number compared against si_signo when recognizing breakpoint events; which definition applies is selected by the preprocessor. */
7224 #define DBG_SIGNAL SIGBUS
7226 #define DBG_SIGNAL SIGSEGV
7230 * mono_arch_is_single_step_event:
7232 * Return whether the machine state in SIGCTX corresponds to a single
/*
 * INFO is interpreted as a siginfo_t. The test below checks whether the
 * faulting address lies within the first 128 bytes (inclusive) of
 * ss_trigger_page. SIGCTX is not referenced by the visible statements.
 */
7236 mono_arch_is_single_step_event (void *info, void *sigctx)
7238 siginfo_t *sinfo = info;
7240 if (!ss_trigger_page)
7243 /* Sometimes the address is off by 4 */
7244 if (sinfo->si_addr >= ss_trigger_page && (guint8*)sinfo->si_addr <= (guint8*)ss_trigger_page + 128)
7251 * mono_arch_is_breakpoint_event:
7253 * Return whether the machine state in SIGCTX corresponds to a breakpoint event.
/*
 * INFO is interpreted as a siginfo_t. For a DBG_SIGNAL signal, the test
 * below checks whether the faulting address lies within the first 128 bytes
 * (inclusive) of bp_trigger_page. SIGCTX is not referenced by the visible
 * statements.
 */
7256 mono_arch_is_breakpoint_event (void *info, void *sigctx)
7258 siginfo_t *sinfo = info;
/* NOTE(review): the guard tests ss_trigger_page although the range check below uses bp_trigger_page - confirm the two pages are always set up together. */
7260 if (!ss_trigger_page)
7263 if (sinfo->si_signo == DBG_SIGNAL) {
7264 /* Sometimes the address is off by 4 */
7265 if (sinfo->si_addr >= bp_trigger_page && (guint8*)sinfo->si_addr <= (guint8*)bp_trigger_page + 128)
7275 * mono_arch_skip_breakpoint:
7277 * See mini-amd64.c for docs.
/* Advance the instruction pointer stored in CTX by 4 bytes. JI is not used by the visible statement. */
7280 mono_arch_skip_breakpoint (MonoContext *ctx, MonoJitInfo *ji)
7282 MONO_CONTEXT_SET_IP (ctx, (guint8*)MONO_CONTEXT_GET_IP (ctx) + 4);
7286 * mono_arch_skip_single_step:
7288 * See mini-amd64.c for docs.
/* Advance the instruction pointer stored in CTX by 4 bytes. */
7291 mono_arch_skip_single_step (MonoContext *ctx)
7293 MONO_CONTEXT_SET_IP (ctx, (guint8*)MONO_CONTEXT_GET_IP (ctx) + 4);
7296 #endif /* MONO_ARCH_SOFT_DEBUG_SUPPORTED */
7299 * mono_arch_get_seq_point_info:
7301 * See mini-amd64.c for docs.
/*
 * Look up the SeqPointInfo in the arch_seq_points hash table of DOMAIN. The
 * creation path finds the MonoJitInfo containing CODE, allocates a zeroed
 * SeqPointInfo followed by ji->code_size extra bytes, fills in the trigger
 * page addresses and the address of single_step_tramp, and inserts it into
 * the table. Both table accesses happen under the domain lock.
 * NOTE(review): the lock is dropped between the lookup and the insert, so
 * two threads could presumably both create an entry - confirm whether that
 * is acceptable.
 */
7304 mono_arch_get_seq_point_info (MonoDomain *domain, guint8 *code)
7309 // FIXME: Add a free function
7311 mono_domain_lock (domain);
7312 info = g_hash_table_lookup (domain_jit_info (domain)->arch_seq_points,
7314 mono_domain_unlock (domain);
7317 ji = mono_jit_info_table_find (domain, (char*)code);
7320 info = g_malloc0 (sizeof (SeqPointInfo) + ji->code_size);
7322 info->ss_trigger_page = ss_trigger_page;
7323 info->bp_trigger_page = bp_trigger_page;
/* Stores the address of the variable, not its current value. */
7324 info->ss_tramp_addr = &single_step_tramp;
7326 mono_domain_lock (domain);
7327 g_hash_table_insert (domain_jit_info (domain)->arch_seq_points,
7329 mono_domain_unlock (domain);
/*
 * Initialize the LMF embedded in EXT: previous_lmf is set to PREV_LMF with
 * the value 2 OR-ed in as a tag, and sp is set to the address of EXT itself.
 */
7336 mono_arch_init_lmf_ext (MonoLMFExt *ext, gpointer prev_lmf)
7338 ext->lmf.previous_lmf = prev_lmf;
7339 /* Mark that this is a MonoLMFExt */
7340 ext->lmf.previous_lmf = (gpointer)(((gssize)ext->lmf.previous_lmf) | 2);
7341 ext->lmf.sp = (gssize)ext;
7345 * mono_arch_set_target:
7347 * Set the target architecture the JIT backend should generate code for, in the form
7348 * of a GNU target triplet. Only used in AOT mode.
/*
 * Derive the architecture feature flags from MTRIPLE by substring matching.
 * The checks are independent of each other and flags are only ever set to
 * TRUE, so a triple may enable several groups of flags.
 */
7351 mono_arch_set_target (char *mtriple)
7353 /* The GNU target triple format is not very well documented */
/* "armv7" is a substring of "armv7s" and "armv7k", so those triples match here as well. */
7354 if (strstr (mtriple, "armv7")) {
7355 v5_supported = TRUE;
7356 v6_supported = TRUE;
7357 v7_supported = TRUE;
7359 if (strstr (mtriple, "armv6")) {
7360 v5_supported = TRUE;
7361 v6_supported = TRUE;
7363 if (strstr (mtriple, "armv7s")) {
7364 v7s_supported = TRUE;
7366 if (strstr (mtriple, "armv7k")) {
7367 v7k_supported = TRUE;
/* "thumbv7s" does not contain "armv7", so it sets the whole v5..v7s chain itself, plus both thumb flags. */
7369 if (strstr (mtriple, "thumbv7s")) {
7370 v5_supported = TRUE;
7371 v6_supported = TRUE;
7372 v7_supported = TRUE;
7373 v7s_supported = TRUE;
7374 thumb_supported = TRUE;
7375 thumb2_supported = TRUE;
7377 if (strstr (mtriple, "darwin") || strstr (mtriple, "ios")) {
7378 v5_supported = TRUE;
7379 v6_supported = TRUE;
7380 thumb_supported = TRUE;
7383 if (strstr (mtriple, "gnueabi"))
7384 eabi_supported = TRUE;
/*
 * Report whether the backend supports OPCODE. The integer atomic opcodes
 * listed first depend on v7_supported alone; the R4/R8 atomic loads and
 * stores additionally require IS_VFP.
 */
7388 mono_arch_opcode_supported (int opcode)
7391 case OP_ATOMIC_ADD_I4:
7392 case OP_ATOMIC_EXCHANGE_I4:
7393 case OP_ATOMIC_CAS_I4:
7394 case OP_ATOMIC_LOAD_I1:
7395 case OP_ATOMIC_LOAD_I2:
7396 case OP_ATOMIC_LOAD_I4:
7397 case OP_ATOMIC_LOAD_U1:
7398 case OP_ATOMIC_LOAD_U2:
7399 case OP_ATOMIC_LOAD_U4:
7400 case OP_ATOMIC_STORE_I1:
7401 case OP_ATOMIC_STORE_I2:
7402 case OP_ATOMIC_STORE_I4:
7403 case OP_ATOMIC_STORE_U1:
7404 case OP_ATOMIC_STORE_U2:
7405 case OP_ATOMIC_STORE_U4:
7406 return v7_supported;
/* Floating point atomics. */
7407 case OP_ATOMIC_LOAD_R4:
7408 case OP_ATOMIC_LOAD_R8:
7409 case OP_ATOMIC_STORE_R4:
7410 case OP_ATOMIC_STORE_R8:
7411 return v7_supported && IS_VFP;
/* Public wrapper which forwards MP and SIG unchanged to get_call_info () and returns its result. */
7418 mono_arch_get_call_info (MonoMemPool *mp, MonoMethodSignature *sig)
7420 return get_call_info (mp, sig);
/* Architecture hook taking no arguments. NOTE(review): presumably returns a trampoline for reading TLS values, or nothing if unsupported - confirm. */
7424 mono_arch_get_get_tls_tramp (void)
/*
 * Emit code which loads an AOT constant into DREG. A patch of type
 * PATCH_TYPE with payload DATA is recorded at the current code offset; the
 * emitted sequence loads an inline word (written as NULL here) into DREG and
 * then uses DREG as a PC-relative index for a second load.
 */
7430 emit_aotconst (MonoCompile *cfg, guint8 *code, int dreg, int patch_type, gpointer data)
7433 mono_add_patch_info (cfg, code - cfg->native_code, patch_type, data);
7434 ARM_LDR_IMM (code, dreg, ARMREG_PC, 0);
/* Placeholder word. NOTE(review): presumably filled in when the recorded patch is resolved - confirm. */
7436 *(gpointer*)code = NULL;
7438 /* Load the value from the GOT */
7439 ARM_LDR_REG_REG (code, dreg, ARMREG_PC, dreg);
7444 mono_arm_emit_aotconst (gpointer ji_list, guint8 *code, guint8 *buf, int dreg, int patch_type, gconstpointer data)
7446 MonoJumpInfo **ji = (MonoJumpInfo**)ji_list;
7448 *ji = mono_patch_info_list_prepend (*ji, code - buf, patch_type, data);
7449 ARM_LDR_IMM (code, dreg, ARMREG_PC, 0);
7451 *(gpointer*)code = NULL;
7453 ARM_LDR_REG_REG (code, dreg, ARMREG_PC, dreg);