* Dietmar Maurer (dietmar@ximian.com)
* Paolo Molaro (lupus@ximian.com)
* Carlos Valiente <yo@virutass.net>
+ * Andreas Faerber <andreas.faerber@web.de>
*
* (C) 2001 Ximian, Inc.
+ * (C) 2007-2008 Andreas Faerber
*/
#include <config.h>
#include "mini.h"
#include "mini-ppc.h"
+static guint8* nullified_class_init_trampoline; /* assigned when the CLASS_INIT generic trampoline is created, or looked up lazily in AOT-only mode */
+
+/*
+ * mono_ppc_create_ftnptr:
+ *
+ * Same as mono_create_ftnptr, but doesn't require a domain. When
+ * PPC_USES_FUNCTION_DESCRIPTOR is defined, CODE is wrapped in a descriptor
+ * reserved from the global code manager, with its toc and env fields set to
+ * NULL; otherwise CODE itself is returned.
+ */
+static gpointer
+mono_ppc_create_ftnptr (guint8 *code)
+{
+#ifndef PPC_USES_FUNCTION_DESCRIPTOR
+	return code;
+#else
+	MonoPPCFunctionDescriptor *desc;
+
+	desc = mono_global_codeman_reserve (sizeof (MonoPPCFunctionDescriptor));
+	desc->env = NULL;
+	desc->toc = NULL;
+	desc->code = code;
+
+	return desc;
+#endif
+}
+
+/*
+ * branch_for_target_reachable:
+ *
+ * Return the instruction (primary opcode 18) to jump from BRANCH to TARGET,
+ * or 0 if TARGET is not reachable with a single instruction, i.e. when the
+ * byte displacement lies outside -33554432 .. 33554431.
+ * The displacement must be a multiple of 4 (asserted).
+ */
+static guint32
+branch_for_target_reachable (guint8 *branch, guint8 *target)
+{
+	/*
+	 * Keep the full pointer-sized difference. Storing it in a 32-bit
+	 * gint would truncate it on 64-bit targets, so a far away target
+	 * whose low 32 bits happen to be small would look reachable.
+	 */
+	gssize diff = target - branch;
+
+	g_assert ((diff & 3) == 0);
+
+	if (diff < -33554432 || diff > 33554431)
+		return 0;
+
+	/* the low 26 bits hold the (two's complement) displacement */
+	return (18 << 26) | ((guint32) diff & 0x03ffffff);
+}
+
/*
* get_unbox_trampoline:
* @m: method pointer
* this argument. This method returns a pointer to a trampoline which does
* unboxing before calling the method
*/
-static gpointer
-get_unbox_trampoline (MonoMethod *m, gpointer addr)
+gpointer
+mono_arch_get_unbox_trampoline (MonoMethod *m, gpointer addr)
{
guint8 *code, *start;
int this_pos = 3;
+ guint32 short_branch; /* single-instruction branch to addr, or 0 if addr is out of range */
MonoDomain *domain = mono_domain_get ();
+ int size = MONO_PPC_32_64_CASE (20, 32) + PPC_FTNPTR_SIZE; /* bytes reserved for the trampoline */
+
+ addr = mono_get_addr_from_ftnptr (addr);
- if (!mono_method_signature (m)->ret->byref && MONO_TYPE_ISSTRUCT (mono_method_signature (m)->ret))
- this_pos = 4;
-
mono_domain_lock (domain);
- start = code = mono_code_manager_reserve (domain->code_mp, 20);
+ start = code = mono_domain_code_reserve (domain, size);
+ code = mono_ppc_create_pre_code_ftnptr (code);
+ short_branch = branch_for_target_reachable (code + 4, addr); /* the branch is emitted after the 4-byte addi */
+ if (short_branch)
+ mono_domain_code_commit (domain, code, size, 8); /* short form is addi + branch = 8 bytes */
mono_domain_unlock (domain);
- ppc_load (code, ppc_r0, addr);
- ppc_mtctr (code, ppc_r0);
- ppc_addi (code, this_pos, this_pos, sizeof (MonoObject));
- ppc_bcctr (code, 20, 0);
+ if (short_branch) {
+ ppc_addi (code, this_pos, this_pos, sizeof (MonoObject)); /* advance register this_pos by sizeof (MonoObject) */
+ ppc_emit32 (code, short_branch);
+ } else {
+ ppc_load_ptr (code, ppc_r0, addr); /* long form: load addr into r0 and jump through CTR */
+ ppc_mtctr (code, ppc_r0);
+ ppc_addi (code, this_pos, this_pos, sizeof (MonoObject));
+ ppc_bcctr (code, 20, 0);
+ }
mono_arch_flush_icache (start, code - start);
- g_assert ((code - start) <= 20);
+ g_assert ((code - start) <= size);
/*g_print ("unbox trampoline at %d for %s:%s\n", this_pos, m->klass->name, m->name);
g_print ("unbox code is at %p for method at %p\n", start, addr);*/
return start;
}
-/* Stack size for trampoline function
- * PPC_MINIMAL_STACK_SIZE + 16 (args + alignment to ppc_magic_trampoline)
- * + MonoLMF + 14 fp regs + 13 gregs + alignment
- * #define STACK (PPC_MINIMAL_STACK_SIZE + 4 * sizeof (gulong) + sizeof (MonoLMF) + 14 * sizeof (double) + 13 * (sizeof (gulong)))
- * STACK would be 444 for 32 bit darwin
- */
-#define STACK (448)
-
-/* Method-specific trampoline code fragment size */
-#define METHOD_TRAMPOLINE_SIZE 64
-
-/* Jump-specific trampoline code fragment size */
-#define JUMP_TRAMPOLINE_SIZE 64
-
-/**
- * ppc_magic_trampoline:
- * @code: pointer into caller code
- * @method: the method to translate
- * @sp: stack pointer
+/*
+ * mono_arch_get_static_rgctx_trampoline:
*
- * This method is called by the function 'arch_create_jit_trampoline', which in
- * turn is called by the trampoline functions for virtual methods.
- * After having called the JIT compiler to compile the method, it inspects the
- * caller code to find the address of the method-specific part of the
- * trampoline vtable slot for this method, updates it with a fragment that calls
- * the newly compiled code and returns this address of the compiled code to
- * 'arch_create_jit_trampoline'
+ * Create a trampoline which sets RGCTX_REG to MRGCTX, then jumps to ADDR.
*/
-static gpointer
-ppc_magic_trampoline (MonoMethod *method, guint32 *code, char *sp)
+gpointer
+mono_arch_get_static_rgctx_trampoline (MonoMethod *m, MonoMethodRuntimeGenericContext *mrgctx, gpointer addr)
{
- char *o = NULL;
- gpointer addr;
- MonoJitInfo *ji, *target_ji;
- int reg, offset = 0;
+ guint8 *code, *start, *p;
+ guint8 imm_buf [128];
+ guint32 short_branch;
+ MonoDomain *domain = mono_domain_get ();
+ int imm_size;
+ int size = MONO_PPC_32_64_CASE (24, (PPC_LOAD_SEQUENCE_LENGTH * 2) + 8) + PPC_FTNPTR_SIZE;
- addr = mono_compile_method(method);
- /*g_print ("method code at %p for %s:%s\n", addr, method->klass->name, method->name);*/
- g_assert(addr);
+ addr = mono_get_addr_from_ftnptr (addr);
- if (!code){
- return addr;
+ /* Compute size of code needed to emit mrgctx */
+ p = imm_buf;
+ ppc_load_ptr (p, MONO_ARCH_RGCTX_REG, mrgctx);
+ imm_size = p - imm_buf;
+
+ mono_domain_lock (domain);
+ start = code = mono_domain_code_reserve (domain, size);
+ code = mono_ppc_create_pre_code_ftnptr (code);
+ short_branch = branch_for_target_reachable (code + imm_size, addr);
+ if (short_branch)
+ mono_domain_code_commit (domain, code, size, imm_size + 4);
+ mono_domain_unlock (domain);
+
+ if (short_branch) {
+ ppc_load_ptr (code, MONO_ARCH_RGCTX_REG, mrgctx);
+ ppc_emit32 (code, short_branch);
+ } else {
+ ppc_load_ptr (code, ppc_r0, addr);
+ ppc_mtctr (code, ppc_r0);
+ ppc_load_ptr (code, MONO_ARCH_RGCTX_REG, mrgctx);
+ ppc_bcctr (code, 20, 0);
}
+ mono_arch_flush_icache (start, code - start);
+ g_assert ((code - start) <= size);
- /* We can't trampoline across domains */
- ji = mono_jit_info_table_find (mono_domain_get (), code);
- target_ji = mono_jit_info_table_find (mono_domain_get (), addr);
- if (!mono_method_same_domain (ji, target_ji))
- return addr;
+ return start;
+}
+
+void
+mono_arch_patch_callsite (guint8 *method_start, guint8 *code_ptr, guint8 *addr)
+{
+ guint32 *code = (guint32*)code_ptr;
+
+ addr = mono_get_addr_from_ftnptr (addr);
- /* Locate the address of the method-specific trampoline. The call using
- the vtable slot that took the processing flow to 'arch_create_jit_trampoline'
- looks something like this:
-
- mtlr rA ; Move rA (a register containing the
- ; target address) to LR
- blrl ; Call function at LR
-
- PowerPC instructions are 32-bit long, which means that a 32-bit target
- address cannot be encoded as an immediate value (because we already
- have spent some bits to encode the branch instruction!). That's why a
- 'b'ranch to the contents of the 'l'ink 'r'egister (with 'l'ink register
- update) is needed, instead of a simpler 'branch immediate'. This
- complicates our purpose here, because 'blrl' overwrites LR, which holds
- the value we're interested in.
-
- Therefore, we need to locate the 'mtlr rA' instruction to know which
- register LR was loaded from, and then retrieve the value from that
- register */
-
/* This is the 'blrl' instruction */
--code;
*/
if (((*code) >> 26) == 18) {
/*g_print ("direct patching\n");*/
- ppc_patch ((char*)code, addr);
- mono_arch_flush_icache ((char*)code, 4);
- return addr;
+ ppc_patch ((guint8*)code, addr);
+ mono_arch_flush_icache ((guint8*)code, 4);
+ return;
}
- /* Sanity check: instruction must be 'blrl' */
- g_assert(*code == 0x4e800021);
+ /* Sanity check */
+ g_assert (mono_ppc_is_direct_call_sequence (code));
- /* the thunk-less direct call sequence: lis/ori/mtlr/blrl */
- if ((code [-1] >> 26) == 31 && (code [-2] >> 26) == 24 && (code [-3] >> 26) == 15) {
- ppc_patch ((char*)code, addr);
- return addr;
- }
+ ppc_patch ((guint8*)code, addr);
+}
- /* OK, we're now at the 'blrl' instruction. Now walk backwards
- till we get to a 'mtlr rA' */
- for(; --code;) {
- if((*code & 0x7c0803a6) == 0x7c0803a6) {
- gint16 soff;
- gint reg_offset;
- /* Here we are: we reached the 'mtlr rA'.
- Extract the register from the instruction */
- reg = (*code & 0x03e00000) >> 21;
- --code;
- /* ok, this is a lwz reg, offset (vtreg)
- * it is emitted with:
- * ppc_emit32 (c, (32 << 26) | ((D) << 21) | ((a) << 16) | (guint16)(d))
- */
- soff = (*code & 0xffff);
- offset = soff;
- reg = (*code >> 16) & 0x1f;
- g_assert (reg != ppc_r1);
- /*g_print ("patching reg is %d\n", reg);*/
- if (reg >= 13) {
- /* saved in the MonoLMF structure */
- reg_offset = STACK - sizeof (MonoLMF) + G_STRUCT_OFFSET (MonoLMF, iregs);
- reg_offset += (reg - 13) * sizeof (gulong);
- } else {
- /* saved in the stack, see frame diagram below */
- reg_offset = STACK - sizeof (MonoLMF) - (14 * sizeof (double)) - (13 * sizeof (gulong));
- reg_offset += reg * sizeof (gulong);
- }
- /* o contains now the value of register reg */
- o = *((char**) (sp + reg_offset));
- break;
- }
- }
+void
+mono_arch_patch_plt_entry (guint8 *code, gpointer *got, mgreg_t *regs, guint8 *addr)
+{
+ guint32 ins1, ins2, offset;
- /* this is not done for non-virtual calls, because in that case
- we won't have an object, but the actual pointer to the
- valuetype as the this argument
- */
- if (method->klass->valuetype && !mono_aot_is_got_entry (code, o))
- addr = get_unbox_trampoline (method, addr);
+ /* Patch the jump table entry used by the plt entry */
+
+ /* Should be a lis+ori */
+ ins1 = ((guint32*)code)[0];
+ g_assert (ins1 >> 26 == 15);
+ ins2 = ((guint32*)code)[1];
+ g_assert (ins2 >> 26 == 24);
+ offset = ((ins1 & 0xffff) << 16) | (ins2 & 0xffff);
- o += offset;
- if (mono_aot_is_got_entry (code, o) || mono_domain_owns_vtable_slot (mono_domain_get (), o))
- *((gpointer *)o) = addr;
- return addr;
+ /* Either got or regs is set */
+ if (!got)
+ got = (gpointer*)(gsize) regs [30];
+ *(guint8**)((guint8*)got + offset) = addr;
}
-static void
-ppc_class_init_trampoline (void *vtable, guint32 *code, char *sp)
+void
+mono_arch_nullify_class_init_trampoline (guint8 *code, mgreg_t *regs)
{
- mono_runtime_class_init (vtable);
+ mono_arch_patch_callsite (NULL, code, nullified_class_init_trampoline); /* redirect the call site at code to the nullified class init trampoline */
+}
-#if 0
- /* This is the 'bl' instruction */
- --code;
-
- if (((*code) >> 26) == 18) {
- ppc_ori (code, 0, 0, 0); /* nop */
- mono_arch_flush_icache (code, 4);
- return;
- } else {
- g_assert_not_reached ();
- }
-#endif
+void
+mono_arch_nullify_plt_entry (guint8 *code, mgreg_t *regs)
+{
+ if (mono_aot_only && !nullified_class_init_trampoline) /* AOT-only mode: look the trampoline up on first use */
+ nullified_class_init_trampoline = mono_aot_get_trampoline ("nullified_class_init_trampoline");
+
+ mono_arch_patch_plt_entry (code, NULL, regs, nullified_class_init_trampoline); /* got is passed as NULL, so the callee takes it from regs */
}
+/* Stack size for trampoline function
+ * PPC_MINIMAL_STACK_SIZE + 4 * sizeof (mgreg_t) (args + alignment for the trampoline handler call)
+ * + MonoLMF + 14 fp regs + 31 gregs, rounded up to MONO_ARCH_FRAME_ALIGNMENT
+ */
+#define STACK (((PPC_MINIMAL_STACK_SIZE + 4 * sizeof (mgreg_t) + sizeof (MonoLMF) + 14 * sizeof (double) + 31 * sizeof (mgreg_t)) + (MONO_ARCH_FRAME_ALIGNMENT - 1)) & ~(MONO_ARCH_FRAME_ALIGNMENT - 1))
+
+/* Method-specific trampoline code fragment size */
+#define METHOD_TRAMPOLINE_SIZE 64
+
+/* Jump-specific trampoline code fragment size */
+#define JUMP_TRAMPOLINE_SIZE 64
+
+#ifdef PPC_USES_FUNCTION_DESCRIPTOR
+#define PPC_TOC_REG ppc_r2
+#else
+#define PPC_TOC_REG -1
+#endif
+
/*
* Stack frame description when the generic trampoline is called.
* caller frame
* -------------------
* Saved FP registers 0-13
* -------------------
- * Saved general registers 0-12
+ * Saved general registers 0-30
* -------------------
* param area for 3 args to ppc_magic_trampoline
* -------------------
* -------------------
*/
guchar*
-mono_arch_create_trampoline_code (MonoTrampolineType tramp_type)
+mono_arch_create_generic_trampoline (MonoTrampolineType tramp_type, MonoTrampInfo **info, gboolean aot)
{
+
guint8 *buf, *code = NULL;
int i, offset;
+ gconstpointer tramp_handler;
+ int size = MONO_PPC_32_64_CASE (600, 800); /* bytes reserved; checked by the assert at the end */
+ GSList *unwind_ops = NULL;
+ MonoJumpInfo *ji = NULL;
- if(!code) {
- /* Now we'll create in 'buf' the PowerPC trampoline code. This
- is the trampoline code common to all methods */
-
- code = buf = mono_global_codeman_reserve (512);
-
- ppc_stwu (buf, ppc_r1, -STACK, ppc_r1);
-
- /* start building the MonoLMF on the stack */
- offset = STACK - sizeof (double) * MONO_SAVED_FREGS;
- for (i = 14; i < 32; i++) {
- ppc_stfd (buf, i, offset, ppc_r1);
- offset += sizeof (double);
- }
- /*
- * now the integer registers. r13 is already saved in the trampoline,
- * and at this point contains the method to compile, so we skip it.
- */
- offset = STACK - sizeof (MonoLMF) + G_STRUCT_OFFSET (MonoLMF, iregs) + sizeof (gulong);
- ppc_stmw (buf, ppc_r14, ppc_r1, offset);
-
- /* Now save the rest of the registers below the MonoLMF struct, first 14
- * fp regs and then the 13 gregs.
- */
- offset = STACK - sizeof (MonoLMF) - (14 * sizeof (double));
- for (i = 0; i < 14; i++) {
- ppc_stfd (buf, i, offset, ppc_r1);
- offset += sizeof (double);
- }
- offset = STACK - sizeof (MonoLMF) - (14 * sizeof (double)) - (13 * sizeof (gulong));
- for (i = 0; i < 13; i++) {
- ppc_stw (buf, i, offset, ppc_r1);
- offset += sizeof (gulong);
- }
- /* we got here through a jump to the ctr reg, we must save the lr
- * in the parent frame (we do it here to reduce the size of the
- * method-specific trampoline)
- */
- ppc_mflr (buf, ppc_r0);
- ppc_stw (buf, ppc_r0, STACK + PPC_RET_ADDR_OFFSET, ppc_r1);
-
- /* ok, now we can continue with the MonoLMF setup, mostly untouched
- * from emit_prolog in mini-ppc.c
- */
- ppc_load (buf, ppc_r0, mono_get_lmf_addr);
- ppc_mtlr (buf, ppc_r0);
- ppc_blrl (buf);
- /* we build the MonoLMF structure on the stack - see mini-ppc.h
- * The pointer to the struct is put in ppc_r11.
- */
- ppc_addi (buf, ppc_r11, ppc_sp, STACK - sizeof (MonoLMF));
- ppc_stw (buf, ppc_r3, G_STRUCT_OFFSET(MonoLMF, lmf_addr), ppc_r11);
- /* new_lmf->previous_lmf = *lmf_addr */
- ppc_lwz (buf, ppc_r0, G_STRUCT_OFFSET(MonoLMF, previous_lmf), ppc_r3);
- ppc_stw (buf, ppc_r0, G_STRUCT_OFFSET(MonoLMF, previous_lmf), ppc_r11);
- /* *(lmf_addr) = r11 */
- ppc_stw (buf, ppc_r11, G_STRUCT_OFFSET(MonoLMF, previous_lmf), ppc_r3);
- /* save method info (it's in r13) */
- ppc_stw (buf, ppc_r13, G_STRUCT_OFFSET(MonoLMF, method), ppc_r11);
- ppc_stw (buf, ppc_sp, G_STRUCT_OFFSET(MonoLMF, ebp), ppc_r11);
- /* save the IP (caller ip) */
- if (tramp_type == MONO_TRAMPOLINE_JUMP) {
- ppc_li (buf, ppc_r0, 0);
- } else {
- ppc_lwz (buf, ppc_r0, STACK + PPC_RET_ADDR_OFFSET, ppc_r1);
- }
- ppc_stw (buf, ppc_r0, G_STRUCT_OFFSET(MonoLMF, eip), ppc_r11);
-
- /*
- * Now we're ready to call ppc_magic_trampoline ().
- */
- /* Arg 1: MonoMethod *method. It was put in r13 */
- ppc_mr (buf, ppc_r3, ppc_r13);
-
- /* Arg 2: code (next address to the instruction that called us) */
- if (tramp_type == MONO_TRAMPOLINE_JUMP) {
- ppc_li (buf, ppc_r4, 0);
- } else {
- ppc_lwz (buf, ppc_r4, STACK + PPC_RET_ADDR_OFFSET, ppc_r1);
- }
-
- /* Arg 3: stack pointer so that the magic trampoline can access the
- * registers we saved above
- */
- ppc_mr (buf, ppc_r5, ppc_r1);
+ /* Now we'll create in 'buf' the PowerPC trampoline code. This
+ is the trampoline code common to all methods */
+
+ code = buf = mono_global_codeman_reserve (size);
+
+ ppc_str_update (code, ppc_r1, -STACK, ppc_r1);
+
+ /* start building the MonoLMF on the stack */
+ offset = STACK - sizeof (double) * MONO_SAVED_FREGS;
+ for (i = 14; i < 32; i++) {
+ ppc_stfd (code, i, offset, ppc_r1);
+ offset += sizeof (double);
+ }
+ /*
+ * now the integer registers.
+ */
+ offset = STACK - sizeof (MonoLMF) + G_STRUCT_OFFSET (MonoLMF, iregs);
+ ppc_str_multiple (code, ppc_r13, offset, ppc_r1); /* stores into MonoLMF.iregs, starting with r13 */
+
+ /* Now save the rest of the registers below the MonoLMF struct, first 14
+ * fp regs and then the 31 gregs.
+ */
+ offset = STACK - sizeof (MonoLMF) - (14 * sizeof (double));
+ for (i = 0; i < 14; i++) {
+ ppc_stfd (code, i, offset, ppc_r1);
+ offset += sizeof (double);
+ }
+#define GREGS_OFFSET (STACK - sizeof (MonoLMF) - (14 * sizeof (double)) - (31 * sizeof (mgreg_t)))
+ offset = GREGS_OFFSET;
+ for (i = 0; i < 31; i++) { /* r0..r30 */
+ ppc_str (code, i, offset, ppc_r1);
+ offset += sizeof (mgreg_t);
+ }
+
+ /* we got here through a jump to the ctr reg, we must save the lr
+ * in the parent frame (we do it here to reduce the size of the
+ * method-specific trampoline)
+ */
+ ppc_mflr (code, ppc_r0);
+ ppc_str (code, ppc_r0, STACK + PPC_RET_ADDR_OFFSET, ppc_r1);
+
+ /* ok, now we can continue with the MonoLMF setup, mostly untouched
+ * from emit_prolog in mini-ppc.c
+ */
+ if (aot) {
+ code = mono_arch_emit_load_aotconst (buf, code, &ji, MONO_PATCH_INFO_JIT_ICALL_ADDR, "mono_get_lmf_addr");
+#ifdef PPC_USES_FUNCTION_DESCRIPTOR
+ ppc_ldptr (code, ppc_r2, sizeof (gpointer), ppc_r11);
+ ppc_ldptr (code, ppc_r11, 0, ppc_r11);
+#endif
+ ppc_mtlr (code, ppc_r11);
+ ppc_blrl (code);
+ } else {
+ ppc_load_func (code, ppc_r0, mono_get_lmf_addr);
+ ppc_mtlr (code, ppc_r0);
+ ppc_blrl (code);
+ }
+ /* we build the MonoLMF structure on the stack - see mini-ppc.h
+ * The pointer to the struct is put in ppc_r11.
+ */
+ ppc_addi (code, ppc_r11, ppc_sp, STACK - sizeof (MonoLMF));
+ ppc_stptr (code, ppc_r3, G_STRUCT_OFFSET(MonoLMF, lmf_addr), ppc_r11);
+ /* new_lmf->previous_lmf = *lmf_addr */
+ ppc_ldptr (code, ppc_r0, G_STRUCT_OFFSET(MonoLMF, previous_lmf), ppc_r3);
+ ppc_stptr (code, ppc_r0, G_STRUCT_OFFSET(MonoLMF, previous_lmf), ppc_r11);
+ /* *(lmf_addr) = r11 */
+ ppc_stptr (code, ppc_r11, G_STRUCT_OFFSET(MonoLMF, previous_lmf), ppc_r3);
+ /* save method info (it's stored on the stack, so get it first). */
+ if ((tramp_type == MONO_TRAMPOLINE_JIT) || (tramp_type == MONO_TRAMPOLINE_JUMP)) {
+ ppc_ldr (code, ppc_r0, GREGS_OFFSET, ppc_r1); /* the saved value of r0 */
+ ppc_stptr (code, ppc_r0, G_STRUCT_OFFSET(MonoLMF, method), ppc_r11);
+ } else {
+ ppc_load (code, ppc_r0, 0); /* other trampoline types record no method */
+ ppc_stptr (code, ppc_r0, G_STRUCT_OFFSET(MonoLMF, method), ppc_r11);
+ }
+ /* store the frame pointer of the calling method */
+ ppc_addi (code, ppc_r0, ppc_sp, STACK);
+ ppc_stptr (code, ppc_r0, G_STRUCT_OFFSET(MonoLMF, ebp), ppc_r11);
+ /* save the IP (caller ip) */
+ if (tramp_type == MONO_TRAMPOLINE_JUMP) {
+ ppc_li (code, ppc_r0, 0);
+ } else {
+ ppc_ldr (code, ppc_r0, STACK + PPC_RET_ADDR_OFFSET, ppc_r1);
+ }
+ ppc_stptr (code, ppc_r0, G_STRUCT_OFFSET(MonoLMF, eip), ppc_r11);
+
+ /*
+ * Now we're ready to call trampoline (mgreg_t *regs, guint8 *code, gpointer value, guint8 *tramp)
+ * Note that the last argument is unused.
+ */
+ /* Arg 1: a pointer to the registers */
+ ppc_addi (code, ppc_r3, ppc_r1, GREGS_OFFSET);
- if (tramp_type == MONO_TRAMPOLINE_CLASS_INIT) {
- ppc_lis (buf, ppc_r0, (guint32) ppc_class_init_trampoline >> 16);
- ppc_ori (buf, ppc_r0, ppc_r0, (guint32) ppc_class_init_trampoline & 0xffff);
- } else {
- ppc_lis (buf, ppc_r0, (guint32) ppc_magic_trampoline >> 16);
- ppc_ori (buf, ppc_r0, ppc_r0, (guint32) ppc_magic_trampoline & 0xffff);
- }
- ppc_mtlr (buf, ppc_r0);
- ppc_blrl (buf);
+ /* Arg 2: code (next address to the instruction that called us) */
+ if (tramp_type == MONO_TRAMPOLINE_JUMP)
+ ppc_li (code, ppc_r4, 0);
+ else
+ ppc_ldr (code, ppc_r4, STACK + PPC_RET_ADDR_OFFSET, ppc_r1);
+
+ /* Arg 3: trampoline argument */
+ if (tramp_type == MONO_TRAMPOLINE_GENERIC_CLASS_INIT)
+ ppc_ldr (code, ppc_r5, GREGS_OFFSET + MONO_ARCH_VTABLE_REG * sizeof (mgreg_t), ppc_r1); /* the saved value of the vtable register */
+ else
+ ppc_ldr (code, ppc_r5, GREGS_OFFSET, ppc_r1); /* the saved value of r0 */
+
+ if (aot) {
+ code = mono_arch_emit_load_aotconst (buf, code, &ji, MONO_PATCH_INFO_JIT_ICALL_ADDR, g_strdup_printf ("trampoline_func_%d", tramp_type));
+#ifdef PPC_USES_FUNCTION_DESCRIPTOR
+ ppc_ldptr (code, ppc_r2, sizeof (gpointer), ppc_r11);
+ ppc_ldptr (code, ppc_r11, 0, ppc_r11);
+#endif
+ ppc_mtlr (code, ppc_r11);
+ ppc_blrl (code);
+ } else {
+ tramp_handler = mono_get_trampoline_func (tramp_type);
+ ppc_load_func (code, ppc_r0, tramp_handler);
+ ppc_mtlr (code, ppc_r0);
+ ppc_blrl (code);
+ }
- /* OK, code address is now on r3. Move it to the counter reg
- * so it will be ready for the final jump: this is safe since we
- * won't do any more calls.
- */
- ppc_mtctr (buf, ppc_r3);
-
- /*
- * Now we restore the MonoLMF (see emit_epilogue in mini-ppc.c)
- * and the rest of the registers, so the method called will see
- * the same state as before we executed.
- * The pointer to MonoLMF is in ppc_r11.
- */
- ppc_addi (buf, ppc_r11, ppc_r1, STACK - sizeof (MonoLMF));
- /* r5 = previous_lmf */
- ppc_lwz (buf, ppc_r5, G_STRUCT_OFFSET(MonoLMF, previous_lmf), ppc_r11);
- /* r6 = lmf_addr */
- ppc_lwz (buf, ppc_r6, G_STRUCT_OFFSET(MonoLMF, lmf_addr), ppc_r11);
- /* *(lmf_addr) = previous_lmf */
- ppc_stw (buf, ppc_r5, G_STRUCT_OFFSET(MonoLMF, previous_lmf), ppc_r6);
- /* restore iregs: this time include r13 */
- ppc_lmw (buf, ppc_r13, ppc_r11, G_STRUCT_OFFSET(MonoLMF, iregs));
- /* restore fregs */
- for (i = 14; i < 32; i++) {
- ppc_lfd (buf, i, G_STRUCT_OFFSET(MonoLMF, fregs) + ((i-14) * sizeof (gdouble)), ppc_r11);
- }
-
- /* restore the volatile registers, we skip r1, of course */
- offset = STACK - sizeof (MonoLMF) - (14 * sizeof (double));
- for (i = 0; i < 14; i++) {
- ppc_lfd (buf, i, offset, ppc_r1);
- offset += sizeof (double);
- }
- offset = STACK - sizeof (MonoLMF) - (14 * sizeof (double)) - (13 * sizeof (gulong));
- ppc_lwz (buf, ppc_r0, offset, ppc_r1);
- offset += 2 * sizeof (gulong);
- for (i = 2; i < 13; i++) {
- ppc_lwz (buf, i, offset, ppc_r1);
- offset += sizeof (gulong);
- }
-
- /* Non-standard function epilogue. Instead of doing a proper
- * return, we just hump to the compiled code.
- */
- /* Restore stack pointer and LR and jump to the code */
- ppc_lwz (buf, ppc_r1, 0, ppc_r1);
- ppc_lwz (buf, ppc_r11, PPC_RET_ADDR_OFFSET, ppc_r1);
- ppc_mtlr (buf, ppc_r11);
- ppc_bcctr (buf, 20, 0);
-
- /* Flush instruction cache, since we've generated code */
- mono_arch_flush_icache (code, buf - code);
+ /* OK, code address is now on r3. Move it to the counter reg
+ * so it will be ready for the final jump: this is safe since we
+ * won't do any more calls.
+ */
+ if (!MONO_TRAMPOLINE_TYPE_MUST_RETURN (tramp_type)) { /* r3 is only used as a jump target when we do not return to the caller */
+#ifdef PPC_USES_FUNCTION_DESCRIPTOR
+ ppc_ldptr (code, ppc_r2, sizeof (gpointer), ppc_r3);
+ ppc_ldptr (code, ppc_r3, 0, ppc_r3);
+#endif
+ ppc_mtctr (code, ppc_r3);
+ }
+
+ /*
+ * Now we restore the MonoLMF (see emit_epilogue in mini-ppc.c)
+ * and the rest of the registers, so the method called will see
+ * the same state as before we executed.
+ * The pointer to MonoLMF is in ppc_r11.
+ */
+ ppc_addi (code, ppc_r11, ppc_r1, STACK - sizeof (MonoLMF));
+ /* r5 = previous_lmf */
+ ppc_ldptr (code, ppc_r5, G_STRUCT_OFFSET(MonoLMF, previous_lmf), ppc_r11);
+ /* r6 = lmf_addr */
+ ppc_ldptr (code, ppc_r6, G_STRUCT_OFFSET(MonoLMF, lmf_addr), ppc_r11);
+ /* *(lmf_addr) = previous_lmf */
+ ppc_stptr (code, ppc_r5, G_STRUCT_OFFSET(MonoLMF, previous_lmf), ppc_r6);
+ /* restore iregs */
+ ppc_ldr_multiple (code, ppc_r13, G_STRUCT_OFFSET(MonoLMF, iregs), ppc_r11);
+ /* restore fregs */
+ for (i = 14; i < 32; i++)
+ ppc_lfd (code, i, G_STRUCT_OFFSET(MonoLMF, fregs) + ((i-14) * sizeof (gdouble)), ppc_r11);
+
+ /* restore the volatile registers, we skip r1, of course */
+ offset = STACK - sizeof (MonoLMF) - (14 * sizeof (double));
+ for (i = 0; i < 14; i++) {
+ ppc_lfd (code, i, offset, ppc_r1);
+ offset += sizeof (double);
+ }
+ offset = STACK - sizeof (MonoLMF) - (14 * sizeof (double)) - (31 * sizeof (mgreg_t));
+ ppc_ldr (code, ppc_r0, offset, ppc_r1);
+ offset += 2 * sizeof (mgreg_t);
+ for (i = 2; i < 13; i++) {
+ if (i != PPC_TOC_REG && (i != 3 || tramp_type != MONO_TRAMPOLINE_RGCTX_LAZY_FETCH)) /* leave the TOC register untouched; for lazy fetch keep r3 as set by the handler */
+ ppc_ldr (code, i, offset, ppc_r1);
+ offset += sizeof (mgreg_t);
+ }
+
+ /* Non-standard function epilogue. Instead of doing a proper
+ * return, we just jump to the compiled code.
+ */
+ /* Restore stack pointer and LR and jump to the code */
+ ppc_ldr (code, ppc_r1, 0, ppc_r1);
+ ppc_ldr (code, ppc_r11, PPC_RET_ADDR_OFFSET, ppc_r1);
+ ppc_mtlr (code, ppc_r11);
+ if (MONO_TRAMPOLINE_TYPE_MUST_RETURN (tramp_type))
+ ppc_blr (code); /* return to the caller through LR */
+ else
+ ppc_bcctr (code, 20, 0); /* jump to the address moved into CTR above */
+
+ /* Flush instruction cache, since we've generated code */
+ mono_arch_flush_icache (buf, code - buf);
- /* Sanity check */
- g_assert ((buf - code) <= 512);
+ /* Sanity check */
+ g_assert ((code - buf) <= size);
+
+ if (tramp_type == MONO_TRAMPOLINE_CLASS_INIT) {
+ /* Initialize the nullified class init trampoline */
+ nullified_class_init_trampoline = mono_ppc_create_ftnptr (mono_arch_get_nullified_class_init_trampoline (NULL));
}
- return code;
+ if (info)
+ *info = mono_tramp_info_create (mono_get_generic_trampoline_name (tramp_type), buf, code - buf, ji, unwind_ops);
+
+ return buf;
}
-static MonoJitInfo*
-create_specific_tramp (MonoMethod *method, guint8* tramp, MonoDomain *domain) {
- guint8 *code, *buf;
- MonoJitInfo *ji;
+#define TRAMPOLINE_SIZE (MONO_PPC_32_64_CASE (24, (5+5+1+1)*4))
+gpointer
+mono_arch_create_specific_trampoline (gpointer arg1, MonoTrampolineType tramp_type, MonoDomain *domain, guint32 *code_len)
+{
+ guint8 *code, *buf, *tramp;
+ guint32 short_branch; /* single-instruction branch to tramp, or 0 if tramp is out of range */
+
+ tramp = mono_get_trampoline_code (tramp_type);
mono_domain_lock (domain);
- code = buf = mono_code_manager_reserve (domain->code_mp, 32);
+ code = buf = mono_domain_code_reserve_align (domain, TRAMPOLINE_SIZE, 4);
+ short_branch = branch_for_target_reachable (code + MONO_PPC_32_64_CASE (8, 5*4), tramp); /* in the short form the branch follows the load of arg1 */
+#ifdef __mono_ppc64__
+ /* FIXME: make shorter if possible */
+#else
+ if (short_branch)
+ mono_domain_code_commit (domain, code, TRAMPOLINE_SIZE, 12); /* short form: 8-byte load of arg1 + 4-byte branch */
+#endif
mono_domain_unlock (domain);
- /* Save r13 in the place it will have in the on-stack MonoLMF */
- ppc_stw (buf, ppc_r13, -(MONO_SAVED_FREGS * 8 + MONO_SAVED_GREGS * sizeof (gpointer)), ppc_r1);
-
- /* Prepare the jump to the generic trampoline code.*/
- ppc_lis (buf, ppc_r13, (guint32) tramp >> 16);
- ppc_ori (buf, ppc_r13, ppc_r13, (guint32) tramp & 0xffff);
- ppc_mtctr (buf, ppc_r13);
+ if (short_branch) {
+ ppc_load_sequence (code, ppc_r0, (mgreg_t)(gsize) arg1); /* arg1 goes in r0, as in the long form below */
+ ppc_emit32 (code, short_branch);
+ } else {
+ /* Prepare the jump to the generic trampoline code.*/
+ ppc_load_ptr (code, ppc_r0, tramp);
+ ppc_mtctr (code, ppc_r0);
- /* And finally put 'method' in r13 and fly! */
- ppc_lis (buf, ppc_r13, (guint32) method >> 16);
- ppc_ori (buf, ppc_r13, ppc_r13, (guint32) method & 0xffff);
- ppc_bcctr (buf, 20, 0);
+ /* And finally put 'arg1' in r0 and fly! */
+ ppc_load_ptr (code, ppc_r0, arg1);
+ ppc_bcctr (code, 20, 0);
+ }
/* Flush instruction cache, since we've generated code */
- mono_arch_flush_icache (code, buf - code);
-
- g_assert ((buf - code) <= 32);
+ mono_arch_flush_icache (buf, code - buf);
- ji = g_new0 (MonoJitInfo, 1);
- ji->method = method;
- ji->code_start = code;
- ji->code_size = buf - code;
+ g_assert ((code - buf) <= TRAMPOLINE_SIZE);
- mono_jit_stats.method_trampolines++;
+ if (code_len) /* code_len is optional */
+ *code_len = code - buf;
- return ji;
+ return buf;
}
-MonoJitInfo*
-mono_arch_create_jump_trampoline (MonoMethod *method)
+static guint8*
+emit_trampoline_jump (guint8 *code, guint8 *tramp)
{
- guint8 *tramp;
- MonoDomain* domain = mono_domain_get ();
-
- tramp = mono_get_trampoline_code (MONO_TRAMPOLINE_JUMP);
- return create_specific_tramp (method, tramp, domain);
+ guint32 short_branch = branch_for_target_reachable (code, tramp); /* 0 if tramp cannot be reached from code with one branch */
+
+ /* FIXME: we can save a few bytes here by committing if the
+ short branch is possible */
+ if (short_branch) {
+ ppc_emit32 (code, short_branch);
+ } else {
+ ppc_load_ptr (code, ppc_r0, tramp); /* long form: jump through CTR, using r0 as scratch */
+ ppc_mtctr (code, ppc_r0);
+ ppc_bcctr (code, 20, 0);
+ }
+
+ return code; /* position after the emitted jump */
}
-/**
- * arch_create_jit_trampoline:
- * @method: pointer to the method info
- *
- * Creates a trampoline function for virtual methods. If the created
- * code is called it first starts JIT compilation of method,
- * and then calls the newly created method. It also replaces the
- * corresponding vtable entry (see ppc_magic_trampoline).
- *
- * A trampoline consists of two parts: a main fragment, shared by all method
- * trampolines, and some code specific to each method, which hard-codes a
- * reference to that method and then calls the main fragment.
- *
- * The main fragment contains a call to 'ppc_magic_trampoline', which performs
- * call to the JIT compiler and substitutes the method-specific fragment with
- * some code that directly calls the JIT-compiled method.
- *
- * Returns: a pointer to the newly created code
- */
gpointer
-mono_arch_create_jit_trampoline (MonoMethod *method)
+mono_arch_create_rgctx_lazy_fetch_trampoline (guint32 slot, MonoTrampInfo **info, gboolean aot)
{
+#ifdef MONO_ARCH_VTABLE_REG
guint8 *tramp;
- MonoJitInfo *ji;
- MonoDomain* domain = mono_domain_get ();
- gpointer code_start;
+ guint8 *code, *buf;
+ guint8 **rgctx_null_jumps;
+ int tramp_size;
+ int depth, index;
+ int i;
+ gboolean mrgctx;
+ MonoJumpInfo *ji = NULL;
+ GSList *unwind_ops = NULL;
+
+ mrgctx = MONO_RGCTX_SLOT_IS_MRGCTX (slot);
+ index = MONO_RGCTX_SLOT_INDEX (slot);
+ if (mrgctx)
+ index += MONO_SIZEOF_METHOD_RUNTIME_GENERIC_CONTEXT / sizeof (gpointer);
+ for (depth = 0; ; ++depth) { /* find which array in the chain holds the slot; index ends up relative to that array */
+ int size = mono_class_rgctx_get_array_size (depth, mrgctx);
+
+ if (index < size - 1)
+ break;
+ index -= size - 1;
+ }
+
+ tramp_size = MONO_PPC_32_64_CASE (40, 52) + 12 * depth; /* grows with the number of array hops */
+ if (mrgctx)
+ tramp_size += 4;
+ else
+ tramp_size += 12;
+ if (aot)
+ tramp_size += 32;
+
+ code = buf = mono_global_codeman_reserve (tramp_size);
- tramp = mono_get_trampoline_code (MONO_TRAMPOLINE_GENERIC);
- /* FIXME: should pass the domain down to this function */
- ji = create_specific_tramp (method, tramp, domain);
- code_start = ji->code_start;
- g_free (ji);
+ rgctx_null_jumps = g_malloc (sizeof (guint8*) * (depth + 2)); /* branch sites to patch: [0] rgctx null check, [1..depth] array hops, [depth + 1] slot */
+
+ if (mrgctx) {
+ /* get mrgctx ptr */
+ ppc_mr (code, ppc_r4, PPC_FIRST_ARG_REG);
+ } else {
+ /* load rgctx ptr from vtable */
+ ppc_ldptr (code, ppc_r4, G_STRUCT_OFFSET (MonoVTable, runtime_generic_context), PPC_FIRST_ARG_REG);
+ /* is the rgctx ptr null? */
+ ppc_compare_reg_imm (code, 0, ppc_r4, 0);
+ /* if yes, jump to actual trampoline */
+ rgctx_null_jumps [0] = code;
+ ppc_bc (code, PPC_BR_TRUE, PPC_BR_EQ, 0);
+ }
- return code_start;
+ for (i = 0; i < depth; ++i) {
+ /* load ptr to next array */
+ if (mrgctx && i == 0)
+ ppc_ldptr (code, ppc_r4, MONO_SIZEOF_METHOD_RUNTIME_GENERIC_CONTEXT, ppc_r4);
+ else
+ ppc_ldptr (code, ppc_r4, 0, ppc_r4);
+ /* is the ptr null? */
+ ppc_compare_reg_imm (code, 0, ppc_r4, 0);
+ /* if yes, jump to actual trampoline */
+ rgctx_null_jumps [i + 1] = code;
+ ppc_bc (code, PPC_BR_TRUE, PPC_BR_EQ, 0);
+ }
+
+ /* fetch slot */
+ ppc_ldptr (code, ppc_r4, sizeof (gpointer) * (index + 1), ppc_r4);
+ /* is the slot null? */
+ ppc_compare_reg_imm (code, 0, ppc_r4, 0);
+ /* if yes, jump to actual trampoline */
+ rgctx_null_jumps [depth + 1] = code;
+ ppc_bc (code, PPC_BR_TRUE, PPC_BR_EQ, 0);
+ /* otherwise return r4 */
+ /* FIXME: if we use r3 as the work register we can avoid this copy */
+ ppc_mr (code, ppc_r3, ppc_r4);
+ ppc_blr (code); /* fast path ends here: the slot was already filled */
+
+ for (i = mrgctx ? 1 : 0; i <= depth + 1; ++i) /* entry 0 is only set in the non-mrgctx case */
+ ppc_patch (rgctx_null_jumps [i], code);
+
+ g_free (rgctx_null_jumps);
+
+ /* move the rgctx pointer to the VTABLE register */
+ ppc_mr (code, MONO_ARCH_VTABLE_REG, ppc_r3);
+
+ if (aot) {
+ code = mono_arch_emit_load_aotconst (buf, code, &ji, MONO_PATCH_INFO_JIT_ICALL_ADDR, g_strdup_printf ("specific_trampoline_lazy_fetch_%u", slot));
+ /* Branch to the trampoline */
+#ifdef PPC_USES_FUNCTION_DESCRIPTOR
+ ppc_ldptr (code, ppc_r11, 0, ppc_r11);
+#endif
+ ppc_mtctr (code, ppc_r11);
+ ppc_bcctr (code, PPC_BR_ALWAYS, 0);
+ } else {
+ tramp = mono_arch_create_specific_trampoline (GUINT_TO_POINTER (slot),
+ MONO_TRAMPOLINE_RGCTX_LAZY_FETCH, mono_get_root_domain (), NULL);
+
+ /* jump to the actual trampoline */
+ code = emit_trampoline_jump (code, tramp);
+ }
+
+ mono_arch_flush_icache (buf, code - buf);
+
+ g_assert (code - buf <= tramp_size);
+
+ if (info)
+ *info = mono_tramp_info_create (mono_get_rgctx_fetch_trampoline_name (slot), buf, code - buf, ji, unwind_ops);
+
+ return buf;
+#else
+ g_assert_not_reached (); /* taken when MONO_ARCH_VTABLE_REG is not defined */
+#endif
}
-/**
- * mono_arch_create_class_init_trampoline:
- * @vtable: the type to initialize
- *
- * Creates a trampoline function to run a type initializer.
- * If the trampoline is called, it calls mono_runtime_class_init with the
- * given vtable, then patches the caller code so it does not get called any
- * more.
- *
- * Returns: a pointer to the newly created code
- */
+/*
+ * mono_arch_create_generic_class_init_trampoline:
+ * @info: if non-NULL, receives a MonoTrampInfo describing the emitted code
+ * @aot: selects how the address of the specific trampoline is obtained
+ *
+ * Emits a small stub into memory reserved from the global code manager.
+ * The stub loads the byte of the MonoVTable (addressed by
+ * MONO_ARCH_VTABLE_REG) that holds the 'initialized' bitfield, masks it,
+ * and either returns straight to the caller or continues into the
+ * MONO_TRAMPOLINE_GENERIC_CLASS_INIT specific trampoline.
+ *
+ * Returns: the start of the emitted code.
+ */
gpointer
-mono_arch_create_class_init_trampoline (MonoVTable *vtable)
+mono_arch_create_generic_class_init_trampoline (MonoTrampInfo **info, gboolean aot)
{
- guint8 *code, *buf, *tramp;
+ guint8 *tramp;
+ guint8 *code, *buf;
+ static int byte_offset = -1;
+ static guint8 bitmask;
+ guint8 *jump;
+ int tramp_size;
+ GSList *unwind_ops = NULL;
+ MonoJumpInfo *ji = NULL;
- tramp = mono_get_trampoline_code (MONO_TRAMPOLINE_CLASS_INIT);
+ /* Size budget for the emitted code; the AOT variant gets 32 extra bytes. */
+ tramp_size = MONO_PPC_32_64_CASE (32, 44);
+ if (aot)
+ tramp_size += 32;
- /* This is the method-specific part of the trampoline. Its purpose is
- to provide the generic part with the MonoMethod *method pointer. We'll
- use r11 to keep that value, for instance. However, the generic part of
- the trampoline relies on r11 having the same value it had before coming
- here, so we must save it before. */
- mono_domain_lock (vtable->domain);
- code = buf = mono_code_manager_reserve (vtable->domain->code_mp, METHOD_TRAMPOLINE_SIZE);
- mono_domain_unlock (vtable->domain);
+ code = buf = mono_global_codeman_reserve (tramp_size);
- ppc_mflr (buf, ppc_r4);
- ppc_stw (buf, ppc_r4, PPC_RET_ADDR_OFFSET, ppc_sp);
- ppc_stwu (buf, ppc_sp, -64, ppc_sp);
- ppc_load (buf, ppc_r3, vtable);
- ppc_load (buf, ppc_r5, 0);
+ /*
+ * Locate the 'initialized' bitfield inside MonoVTable. The result is
+ * kept in the statics above, so the lookup only runs while byte_offset
+ * is still negative.
+ */
+ if (byte_offset < 0)
+ mono_marshal_find_bitfield_offset (MonoVTable, initialized, &byte_offset, &bitmask);
- ppc_load (buf, ppc_r0, ppc_class_init_trampoline);
- ppc_mtlr (buf, ppc_r0);
- ppc_blrl (buf);
+ /* Load the byte holding the flag from the vtable and mask out the flag bit. */
+ ppc_lbz (code, ppc_r4, byte_offset, MONO_ARCH_VTABLE_REG);
+ ppc_andid (code, ppc_r4, ppc_r4, bitmask);
+ /*
+ * Conditional branch on EQ with a placeholder target; it is patched
+ * below to skip the blr. NOTE(review): presumably EQ means the masked
+ * flag is zero, i.e. the class is not initialized yet - confirm against
+ * the ppc_andid definition.
+ */
+ jump = code;
+ ppc_bc (code, PPC_BR_TRUE, PPC_BR_EQ, 0);
- ppc_lwz (buf, ppc_r0, 64 + PPC_RET_ADDR_OFFSET, ppc_sp);
- ppc_mtlr (buf, ppc_r0);
- ppc_addic (buf, ppc_sp, ppc_sp, 64);
- ppc_blr (buf);
+ /* Branch not taken: return to the caller. */
+ ppc_blr (code);
- /* Flush instruction cache, since we've generated code */
- mono_arch_flush_icache (code, buf - code);
-
- /* Sanity check */
- g_assert ((buf - code) <= METHOD_TRAMPOLINE_SIZE);
+ /* Point the conditional branch at the code emitted from here on. */
+ ppc_patch (jump, code);
- mono_jit_stats.method_trampolines++;
+ if (aot) {
+ /* NOTE(review): the load below is assumed to leave the address in r11, which the following instructions use - confirm. */
+ code = mono_arch_emit_load_aotconst (buf, code, &ji, MONO_PATCH_INFO_JIT_ICALL_ADDR, "specific_trampoline_generic_class_init");
+ /* Branch to the trampoline */
+#ifdef PPC_USES_FUNCTION_DESCRIPTOR
+ ppc_ldptr (code, ppc_r11, 0, ppc_r11);
+#endif
+ ppc_mtctr (code, ppc_r11);
+ ppc_bcctr (code, PPC_BR_ALWAYS, 0);
+ } else {
+ tramp = mono_arch_create_specific_trampoline (NULL, MONO_TRAMPOLINE_GENERIC_CLASS_INIT,
+ mono_get_root_domain (), NULL);
- return code;
+ /* jump to the actual trampoline */
+ code = emit_trampoline_jump (code, tramp);
+ }
+
+ mono_arch_flush_icache (buf, code - buf);
+
+ /* The emitted code must fit in the space reserved above. */
+ g_assert (code - buf <= tramp_size);
+
+ if (info)
+ *info = mono_tramp_info_create (g_strdup_printf ("generic_class_init_trampoline"), buf, code - buf, ji, unwind_ops);
+
+ return buf;
}
-/*
- * This method is only called when running in the Mono Debugger.
- */
+/*
+ * mono_arch_get_nullified_class_init_trampoline:
+ * @info: if non-NULL, receives a MonoTrampInfo describing the emitted code
+ *
+ * Reserves 64 bytes from the global code manager and emits a single blr
+ * into them, so the resulting stub consists of just that one instruction.
+ *
+ * Returns: the start of the emitted code.
+ */
gpointer
-mono_debugger_create_notification_function (void)
+mono_arch_get_nullified_class_init_trampoline (MonoTrampInfo **info)
{
- guint8 *ptr, *buf;
+ guint8 *code, *buf;
+ guint32 tramp_size = 64;
+
+ /* buf keeps the start of the reservation; code advances as instructions are emitted. */
+ code = buf = mono_global_codeman_reserve (tramp_size);
+ ppc_blr (code);
- ptr = buf = mono_global_codeman_reserve (16);
- ppc_break (buf);
- ppc_blr (buf);
- mono_arch_flush_icache (ptr, buf - ptr);
+ mono_arch_flush_icache (buf, code - buf);
- return ptr;
+ /* The emitted code must fit in the space reserved above. */
+ g_assert (code - buf <= tramp_size);
+
+ if (info)
+ *info = mono_tramp_info_create (g_strdup_printf ("nullified_class_init_trampoline"), buf, code - buf, NULL, NULL);
+
+ return buf;
+}
+
+/*
+ * mono_arch_get_call_target:
+ * @code: address of the instruction following a call site
+ *
+ * Decodes the 32-bit word immediately before @code. If that word is a
+ * relative branch-and-link (primary opcode 18, LK bit set, AA bit clear),
+ * the address it transfers control to is returned.
+ *
+ * Returns: the branch target, or NULL if the preceding word is not such
+ * an instruction.
+ */
+guint8*
+mono_arch_get_call_target (guint8 *code)
+{
+	/* Should be a bl */
+	guint32 ins = ((guint32*)(gpointer)code) [-1];
+
+	if ((ins >> 26 == 18) && ((ins & 1) == 1) && ((ins & 2) == 0)) {
+		/*
+		 * The displacement field is a signed 24-bit count of words.
+		 * It has to be sign-extended: treating it as unsigned makes
+		 * every backward call decode to an address 64MB past the
+		 * real target.
+		 */
+		gint32 disp = (gint32)((ins >> 2) & 0xffffff);
+
+		if (disp & 0x800000)
+			disp -= 0x1000000;
+
+		/* The displacement is relative to the branch itself, at code - 4. */
+		return code - 4 + (disp * 4);
+	}
+
+	return NULL;
}
+/*
+ * mono_arch_get_plt_info_offset:
+ * @plt_entry: start of a PLT entry
+ * @regs: not used by this implementation
+ * @code: not used by this implementation
+ *
+ * Views @plt_entry as an array of 32-bit words and reads the one at a
+ * fixed index: 8 when PPC_USES_FUNCTION_DESCRIPTOR is defined, 6 otherwise.
+ *
+ * Returns: the 32-bit word stored at that index.
+ */
+guint32
+mono_arch_get_plt_info_offset (guint8 *plt_entry, mgreg_t *regs, guint8 *code)
+{
+	guint32 *entry_words = (guint32*)plt_entry;
+#ifdef PPC_USES_FUNCTION_DESCRIPTOR
+	const int info_word_index = 8;
+#else
+	const int info_word_index = 6;
+#endif
+
+	return entry_words [info_word_index];
+}