* src/vm/vm.c, src/vm/vm.h: Moved to .cpp.
[cacao.git] / src / vm / jit / arm / codegen.c
index 3e803686aa7e281a954af1bc251f726231c3a37b..e7dd2443eb92bedf5f78210861076a8ecb68b008 100644 (file)
@@ -1,9 +1,7 @@
 /* src/vm/jit/arm/codegen.c - machine code generator for Arm
 
-   Copyright (C) 1996-2005, 2006, 2007 R. Grafl, A. Krall, C. Kruegel,
-   C. Oates, R. Obermaisser, M. Platter, M. Probst, S. Ring,
-   E. Steiner, C. Thalinger, D. Thuernbeck, P. Tomsich, C. Ullrich,
-   J. Wenninger, Institut f. Computersprachen - TU Wien
+   Copyright (C) 1996-2005, 2006, 2007, 2008
+   CACAOVM - Verein zur Foerderung der freien virtuellen Maschine CACAO
 
    This file is part of CACAO.
 
@@ -22,8 +20,6 @@
    Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
    02110-1301, USA.
 
-   $Id: codegen.c 7353 2007-02-13 23:14:35Z twisti $
-
 */
 
 
 
 #include "mm/memory.h"
 
+#include "native/localref.h"
 #include "native/native.h"
 
-#if defined(ENABLE_THREADS)
-# include "threads/native/lock.h"
-#endif
+#include "threads/lock-common.h"
 
 #include "vm/builtin.h"
 #include "vm/exceptions.h"
 #include "vm/global.h"
-#include "vm/vm.h"
+#include "vm/vm.hpp"
 
+#include "vm/jit/abi.h"
 #include "vm/jit/asmpart.h"
 #include "vm/jit/codegen-common.h"
 #include "vm/jit/dseg.h"
 #include "vm/jit/emit-common.h"
 #include "vm/jit/jit.h"
-#include "vm/jit/md.h"
+#include "vm/jit/linenumbertable.h"
 #include "vm/jit/methodheader.h"
 #include "vm/jit/parse.h"
-#include "vm/jit/patcher.h"
+#include "vm/jit/patcher-common.h"
 #include "vm/jit/reg.h"
 
 #if defined(ENABLE_LSRA)
 #include "vmcore/options.h"
 
 
-/* codegen *********************************************************************
+/* codegen_emit ****************************************************************
 
    Generates machine code.
 
 *******************************************************************************/
 
-bool codegen(jitdata *jd)
+bool codegen_emit(jitdata *jd)
 {
        methodinfo         *m;
        codeinfo           *code;
@@ -89,9 +85,6 @@ bool codegen(jitdata *jd)
        varinfo        *var;
        basicblock     *bptr;
        instruction    *iptr;
-       exception_entry *ex;
-       s4              fieldtype;
-       s4              varindex;
 
        s4              spilledregs_num;
        s4              savedregs_num;
@@ -102,6 +95,10 @@ bool codegen(jitdata *jd)
        unresolved_method  *um;
        builtintable_entry *bte;
        methoddesc         *md;
+       fieldinfo          *fi;
+       unresolved_field   *uf;
+       int                 fieldtype;
+       int                 varindex;
 
        /* get required compiler data */
 
@@ -120,64 +117,50 @@ bool codegen(jitdata *jd)
        
        /* space to save used callee saved registers */
 
-       savedregs_num = (jd->isleafmethod) ? 0 : 1;       /* space to save the LR */
+       savedregs_num = code_is_leafmethod(code) ? 0 : 1; /* space to save the LR */
+
        savedregs_num += (INT_SAV_CNT - rd->savintreguse);
-       savedregs_num += (FLT_SAV_CNT - rd->savfltreguse);
+       /*savedregs_num += (FLT_SAV_CNT - rd->savfltreguse);*/
+       assert((FLT_SAV_CNT - rd->savfltreguse) == 0);
 
        spilledregs_num = rd->memuse;
 
 #if defined(ENABLE_THREADS)        /* space to save argument of monitor_enter */
-       if (checksync && (m->flags & ACC_SYNCHRONIZED))
+       if (checksync && code_is_synchronized(code))
                spilledregs_num++;
 #endif
 
-       cd->stackframesize = spilledregs_num + savedregs_num;
+       cd->stackframesize = spilledregs_num * 8 + savedregs_num * 4;
 
        /* XXX QUICK FIX: We shouldn't align the stack in Java code, but
           only in native stubs. */
        /* align stack to 8-byte */
 
-       cd->stackframesize = (cd->stackframesize + 1) & ~1;
+       cd->stackframesize = (cd->stackframesize + 4) & ~4;
 
        /* SECTION: Method Header */
        /* create method header */
 
        (void) dseg_add_unique_address(cd, code);              /* CodeinfoPointer */
-       (void) dseg_add_unique_s4(cd, cd->stackframesize * 4); /* FrameSize       */
+       (void) dseg_add_unique_s4(cd, cd->stackframesize);     /* FrameSize       */
 
-#if defined(ENABLE_THREADS)
-       /* IsSync contains the offset relative to the stack pointer for the
-          argument of monitor_exit used in the exception handler. Since the
-          offset could be zero and give a wrong meaning of the flag it is
-          offset by one.
-       */
-
-       if (checksync && (m->flags & ACC_SYNCHRONIZED))
-               (void) dseg_add_unique_s4(cd, (rd->memuse + 1) * 4);/* IsSync         */
+       code->synchronizedoffset = rd->memuse * 8;
+
+       /* REMOVEME: We still need it for exception handling in assembler. */
+
+       if (code_is_leafmethod(code))
+               (void) dseg_add_unique_s4(cd, 1);
        else
-#endif
-               (void) dseg_add_unique_s4(cd, 0);                  /* IsSync          */
+               (void) dseg_add_unique_s4(cd, 0);
 
-       (void) dseg_add_unique_s4(cd, jd->isleafmethod);       /* IsLeaf          */
        (void) dseg_add_unique_s4(cd, INT_SAV_CNT - rd->savintreguse); /* IntSave */
        (void) dseg_add_unique_s4(cd, FLT_SAV_CNT - rd->savfltreguse); /* FltSave */
-       (void) dseg_addlinenumbertablesize(cd);
-       (void) dseg_add_unique_s4(cd, jd->exceptiontablelength); /* ExTableSize   */
-
-       /* create exception table */
-
-       for (ex = jd->exceptiontable; ex != NULL; ex = ex->down) {
-               dseg_add_target(cd, ex->start);
-               dseg_add_target(cd, ex->end);
-               dseg_add_target(cd, ex->handler);
-               (void) dseg_add_unique_address(cd, ex->catchtype.any);
-       }
 
        /* save return address and used callee saved registers */
 
        savedregs_bitmask = 0;
 
-       if (!jd->isleafmethod)
+       if (!code_is_leafmethod(code))
                savedregs_bitmask = (1<<REG_LR);
 
        for (i = INT_SAV_CNT - 1; i >= rd->savintreguse; i--)
@@ -195,8 +178,8 @@ bool codegen(jitdata *jd)
 
        /* create additional stack frame for spilled variables (if necessary) */
 
-       if ((cd->stackframesize - savedregs_num) > 0)
-               M_SUB_IMM_EXT_MUL4(REG_SP, REG_SP, cd->stackframesize - savedregs_num);
+       if ((cd->stackframesize / 4 - savedregs_num) > 0)
+               M_SUB_IMM_EXT_MUL4(REG_SP, REG_SP, cd->stackframesize / 4 - savedregs_num);
 
        /* take arguments out of register or stack frame */
 
@@ -216,45 +199,28 @@ bool codegen(jitdata *jd)
 
                /* ATTENTION: we use integer registers for all arguments (even float) */
 #if !defined(ENABLE_SOFTFLOAT)
-               if (IS_INT_LNG_TYPE(t)) {                    /* integer args          */
+               if (IS_INT_LNG_TYPE(t)) {
 #endif
-                       if (!md->params[i].inmemory) {           /* register arguments    */
-                               s2 = ARGUMENT_REGS(t, s1);           /* get argument register */
-                               if (!(var->flags & INMEMORY)) {      /* reg arg -> register   */
-                                       if (GET_LOW_REG(var->vv.regoff) == REG_SPLIT || GET_HIGH_REG(var->vv.regoff) == REG_SPLIT) {
-                                               /* TODO: remove this!!! */
-                                               dolog("SPLIT in local var: %x>%x (%s.%s)", s2, var->vv.regoff, m->class->name->text, m->name->text);
-                                               assert(s2 == var->vv.regoff);
-                                       }
-                                       s3 = var->vv.regoff;
-                                       SPLIT_OPEN(t, s2, REG_ITMP1);
-                                       SPLIT_LOAD(t, s2, cd->stackframesize);
-                                       SPLIT_OPEN(t, s3, REG_ITMP1);
-
+                       if (!md->params[i].inmemory) {
+                               if (!(var->flags & INMEMORY)) {
                                        if (IS_2_WORD_TYPE(t))
-                                               M_LNGMOVE(s2, s3);
+                                               M_LNGMOVE(s1, var->vv.regoff);
                                        else
-                                               M_INTMOVE(s2, s3);
-
-                                       SPLIT_STORE_AND_CLOSE(t, s3, cd->stackframesize);
+                                               M_INTMOVE(s1, var->vv.regoff);
                                }
-                               else {                               /* reg arg -> spilled    */
-                                       SPLIT_OPEN(t, s2, REG_ITMP1);
-                                       SPLIT_LOAD(t, s2, cd->stackframesize);
-
+                               else {
                                        if (IS_2_WORD_TYPE(t))
-                                               M_LST(s2, REG_SP, var->vv.regoff * 4);
+                                               M_LST(s1, REG_SP, var->vv.regoff);
                                        else
-                                               M_IST(s2, REG_SP, var->vv.regoff * 4);
-                                       /* no SPLIT_CLOSE here because arg is fully spilled now */
+                                               M_IST(s1, REG_SP, var->vv.regoff);
                                }
                        }
                        else {                                   /* stack arguments       */
                                if (!(var->flags & INMEMORY)) {      /* stack arg -> register */
                                        if (IS_2_WORD_TYPE(t))
-                                               M_LLD(var->vv.regoff, REG_SP, (cd->stackframesize + s1) * 4);
+                                               M_LLD(var->vv.regoff, REG_SP, cd->stackframesize + s1);
                                        else
-                                               M_ILD(var->vv.regoff, REG_SP, (cd->stackframesize + s1) * 4);
+                                               M_ILD(var->vv.regoff, REG_SP, cd->stackframesize + s1);
                                }
                                else {                               /* stack arg -> spilled  */
                                        /* Reuse Memory Position on Caller Stack */
@@ -262,33 +228,30 @@ bool codegen(jitdata *jd)
                                }
                        }
 #if !defined(ENABLE_SOFTFLOAT)
-               } else {                                     /* floating args         */
-                       if (!md->params[i].inmemory) {           /* register arguments    */
-                               s2 = ARGUMENT_REGS(t, s1);           /* get argument register */
-                               if (!(var->flags & INMEMORY)) {      /* reg arg -> register   */
-                                       SPLIT_OPEN(t, s2, REG_ITMP1);
-                                       SPLIT_LOAD(t, s2, cd->stackframesize);
-                                       M_CAST_INT_TO_FLT_TYPED(t, s2, var->vv.regoff);
+               }
+               else {
+                       if (!md->params[i].inmemory) {
+                               if (!(var->flags & INMEMORY)) {
+                                       if (IS_2_WORD_TYPE(t))
+                                               M_CAST_L2D(s1, var->vv.regoff);
+                                       else
+                                               M_CAST_I2F(s1, var->vv.regoff);
                                }
-                               else {                               /* reg arg -> spilled    */
-                                       SPLIT_OPEN(t, s2, REG_ITMP1);
-                                       SPLIT_LOAD(t, s2, cd->stackframesize);
-
+                               else {
                                        if (IS_2_WORD_TYPE(t))
-                                               M_LST(s2, REG_SP, var->vv.regoff * 4);
+                                               M_LST(s1, REG_SP, var->vv.regoff);
                                        else
-                                               M_IST(s2, REG_SP, var->vv.regoff * 4);
-                                       /* no SPLIT_CLOSE here because arg is fully spilled now */
+                                               M_IST(s1, REG_SP, var->vv.regoff);
                                }
                        }
-                       else {                                   /* stack arguments       */
-                               if (!(var->flags & INMEMORY)) {      /* stack arg -> register */
+                       else {
+                               if (!(var->flags & INMEMORY)) {
                                        if (IS_2_WORD_TYPE(t))
-                                               M_DLD(var->vv.regoff, REG_SP, (cd->stackframesize + s1) * 4);
+                                               M_DLD(var->vv.regoff, REG_SP, cd->stackframesize + s1);
                                        else
-                                               M_FLD(var->vv.regoff, REG_SP, (cd->stackframesize + s1) * 4);
+                                               M_FLD(var->vv.regoff, REG_SP, cd->stackframesize + s1);
                                }
-                               else {                               /* stack arg -> spilled  */
+                               else {
                                        /* Reuse Memory Position on Caller Stack */
                                        var->vv.regoff = cd->stackframesize + s1;
                                }
@@ -300,31 +263,29 @@ bool codegen(jitdata *jd)
 #if defined(ENABLE_THREADS)
        /* call monitorenter function */
 
-       if (checksync && (m->flags & ACC_SYNCHRONIZED)) {
+       if (checksync && code_is_synchronized(code)) {
                /* stack offset for monitor argument */
 
-               s1 = rd->memuse;
+               s1 = rd->memuse * 8;
 
 # if !defined(NDEBUG)
                if (JITDATA_HAS_FLAG_VERBOSECALL(jd)) {
                        M_STMFD(BITMASK_ARGS, REG_SP);
-                       s1 += 4;
+                       s1 += 4 * 4;
                }
 # endif
 
                /* get the correct lock object */
 
                if (m->flags & ACC_STATIC) {
-                       disp = dseg_add_address(cd, &m->class->object.header);
+                       disp = dseg_add_address(cd, &m->clazz->object.header);
                        M_DSEG_LOAD(REG_A0, disp);
                }
                else {
-                       M_TST(REG_A0, REG_A0);
-                       M_BEQ(0);
-                       codegen_add_nullpointerexception_ref(cd);
+                       emit_nullpointer_check_force(cd, iptr, REG_A0);
                }
 
-               M_STR(REG_A0, REG_SP, s1 * 4);
+               M_STR(REG_A0, REG_SP, s1);
                disp = dseg_add_functionptr(cd, LOCK_monitor_enter);
                M_DSEG_BRANCH(disp);
                s1 = (s4) (cd->mcodeptr - cd->mcodebase);
@@ -346,6 +307,9 @@ bool codegen(jitdata *jd)
 
        /* end of header generation */
 
+       /* create replacement points */
+       REPLACEMENT_POINTS_INIT(cd, jd);
+
        /* SECTION: ICMD Code Generation */
        /* for all basic blocks */
 
@@ -362,6 +326,9 @@ bool codegen(jitdata *jd)
 
                codegen_resolve_branchrefs(cd, bptr);
 
+               /* handle replacement points */
+               REPLACEMENT_POINT_BLOCK_START(cd, bptr);
+
                /* copy interface registers to their destination */
 
                len = bptr->indepth;
@@ -408,18 +375,21 @@ bool codegen(jitdata *jd)
 
                        /* add line number */
                        if (iptr->line != currentline) {
-                               dseg_addlinenumber(cd, iptr->line);
+                               linenumbertable_list_entry_add(cd, iptr->line);
                                currentline = iptr->line;
                        }
 
                        MCODECHECK(64);   /* an instruction usually needs < 64 words      */
 
-                       /* the big switch */
-                       switch (iptr->opc) {
-               case ICMD_NOP:        /* ... ==> ...                                  */
+               /* the big switch */
+               switch (iptr->opc) {
+
+               case ICMD_NOP:        /* ...  ==> ...                                 */
+               case ICMD_POP:        /* ..., value  ==> ...                          */
+               case ICMD_POP2:       /* ..., value, value  ==> ...                   */
                        break;
 
-       /* constant operations ************************************************/
+               /* constant operations ************************************************/
 
                case ICMD_ICONST:     /* ...  ==> ..., constant                       */
 
@@ -434,12 +404,8 @@ bool codegen(jitdata *jd)
                        if (INSTRUCTION_IS_UNRESOLVED(iptr)) {
                                disp = dseg_add_unique_address(cd, NULL);
 
-                               codegen_addpatchref(cd, PATCHER_aconst,
-                                                   iptr->sx.val.c.ref,
-                                                                       disp);
-
-                               if (opt_showdisassemble)
-                                       M_NOP;
+                               patcher_add_patch_ref(jd, PATCHER_resolve_classref_to_classinfo,
+                                                   iptr->sx.val.c.ref, disp);
 
                                M_DSEG_LOAD(d, disp);
                        }
@@ -497,21 +463,13 @@ bool codegen(jitdata *jd)
                case ICMD_COPY:
                case ICMD_MOVE:
 
-                       emit_copy(jd, iptr, VAROP(iptr->s1), VAROP(iptr->dst));
+                       emit_copy(jd, iptr);
                        break;
 
                case ICMD_ASTORE:
-                       if (!(iptr->flags.bits & INS_FLAG_RETADDR))
-                               emit_copy(jd, iptr, VAROP(iptr->s1), VAROP(iptr->dst));
-                       break;
-
-               /* pop operations *****************************************************/
-
-               /* attention: double and longs are only one entry in CACAO ICMDs      */
-
-               case ICMD_POP:        /* ..., value  ==> ...                          */
-               case ICMD_POP2:       /* ..., value, value  ==> ...                   */
 
+                       if (!(iptr->flags.bits & INS_FLAG_RETADDR))
+                               emit_copy(jd, iptr);
                        break;
 
 
@@ -712,7 +670,7 @@ bool codegen(jitdata *jd)
 
                        s1 = emit_load_s1(jd, iptr, REG_A0);
                        s2 = emit_load_s2(jd, iptr, REG_A1);
-                       gen_div_check(VAROP(iptr->sx.s23.s2)->type, s2);
+                       emit_arithmetic_check(cd, iptr, s2);
 
                        /* move arguments into argument registers */
                        M_INTMOVE(s1, REG_A0);
@@ -739,12 +697,13 @@ bool codegen(jitdata *jd)
                        /* move arguments into argument registers */
 
                        s1 = emit_load_s1(jd, iptr, REG_A0_A1_PACKED);
-                       M_LNGMOVE(s1, REG_A0_A1_PACKED);
-
                        s2 = emit_load_s2(jd, iptr, REG_A2_A3_PACKED);
-                       M_LNGMOVE(s2, REG_A2_A3_PACKED);
+                       /* XXX TODO: only do this if arithmetic check is really done! */
+                       M_ORR(GET_HIGH_REG(s2), GET_LOW_REG(s2), REG_ITMP3);
+                       emit_arithmetic_check(cd, iptr, REG_ITMP3);
 
-                       gen_div_check(VAROP(iptr->sx.s23.s2)->type, s2);
+                       M_LNGMOVE(s1, REG_A0_A1_PACKED);
+                       M_LNGMOVE(s2, REG_A2_A3_PACKED);
 
                        /* call builtin function */
                        bte = iptr->sx.s23.s3.bte;
@@ -793,10 +752,10 @@ bool codegen(jitdata *jd)
                        M_MOV_S(REG_ITMP1, s1);
                        M_RSBMI_IMM(REG_ITMP1, REG_ITMP1, 0);
                        if (IS_IMM(iptr->sx.val.i))
-                               M_AND_IMM(d, REG_ITMP1, iptr->sx.val.i);
+                               M_AND_IMM(REG_ITMP1, iptr->sx.val.i, d);
                        else {
                                ICONST(REG_ITMP3, iptr->sx.val.i);
-                               M_AND(d, REG_ITMP1, REG_ITMP3);
+                               M_AND(REG_ITMP1, REG_ITMP3, d);
                        }
                        M_RSBMI_IMM(d, d, 0);
                        emit_store_dst(jd, iptr, d);
@@ -807,7 +766,7 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
-                       M_AND_IMM(REG_ITMP2, s2, 0x1f);
+                       M_AND_IMM(s2, 0x1f, REG_ITMP2);
                        M_MOV(d, REG_LSL_REG(s1, REG_ITMP2));
                        emit_store_dst(jd, iptr, d);
                        break;
@@ -817,7 +776,7 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
-                       M_AND_IMM(REG_ITMP2, s2, 0x1f);
+                       M_AND_IMM(s2, 0x1f, REG_ITMP2);
                        M_MOV(d, REG_ASR_REG(s1, REG_ITMP2));
                        emit_store_dst(jd, iptr, d);
                        break;
@@ -827,7 +786,7 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
-                       M_AND_IMM(REG_ITMP2, s2, 0x1f);
+                       M_AND_IMM(s2, 0x1f, REG_ITMP2);
                        M_MOV(d, REG_LSR_REG(s1, REG_ITMP2));
                        emit_store_dst(jd, iptr, d);
                        break;
@@ -873,7 +832,7 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
-                       M_AND(d, s1, s2);
+                       M_AND(s1, s2, d);
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -882,10 +841,10 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1_low(jd, iptr, REG_ITMP3);
                        s2 = emit_load_s2_low(jd, iptr, REG_ITMP1);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP12_PACKED);
-                       M_AND(GET_LOW_REG(d), s1, s2);
+                       M_AND(s1, s2, GET_LOW_REG(d));
                        s1 = emit_load_s1_high(jd, iptr, REG_ITMP3);
                        s2 = emit_load_s2_high(jd, iptr, REG_ITMP2);
-                       M_AND(GET_HIGH_REG(d), s1, s2);
+                       M_AND(s1, s2, GET_HIGH_REG(d));
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -894,7 +853,7 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
-                       M_ORR(d, s1, s2);
+                       M_ORR(s1, s2, d);
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -903,10 +862,10 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1_low(jd, iptr, REG_ITMP3);
                        s2 = emit_load_s2_low(jd, iptr, REG_ITMP1);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP12_PACKED);
-                       M_ORR(GET_LOW_REG(d), s1, s2);
+                       M_ORR(s1, s2, GET_LOW_REG(d));
                        s1 = emit_load_s1_high(jd, iptr, REG_ITMP3);
                        s2 = emit_load_s2_high(jd, iptr, REG_ITMP2);
-                       M_ORR(GET_HIGH_REG(d), s1, s2);
+                       M_ORR(s1, s2, GET_HIGH_REG(d));
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -915,7 +874,7 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
-                       M_EOR(d, s1, s2);
+                       M_EOR(s1, s2, d);
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -924,10 +883,10 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1_low(jd, iptr, REG_ITMP3);
                        s2 = emit_load_s2_low(jd, iptr, REG_ITMP1);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP12_PACKED);
-                       M_EOR(GET_LOW_REG(d), s1, s2);
+                       M_EOR(s1, s2, GET_LOW_REG(d));
                        s1 = emit_load_s1_high(jd, iptr, REG_ITMP3);
                        s2 = emit_load_s2_high(jd, iptr, REG_ITMP2);
-                       M_EOR(GET_HIGH_REG(d), s1, s2);
+                       M_EOR(s1, s2, GET_HIGH_REG(d));
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -940,7 +899,7 @@ bool codegen(jitdata *jd)
 
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
                        d = codegen_reg_of_dst(jd, iptr, REG_FTMP1);
-                       M_MNFS(d, s1);
+                       M_FNEG(s1, d);
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -949,7 +908,7 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
                        s2 = emit_load_s2(jd, iptr, REG_FTMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_FTMP1);
-                       M_ADFS(d, s1, s2);
+                       M_FADD(s1, s2, d);
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -958,7 +917,7 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
                        s2 = emit_load_s2(jd, iptr, REG_FTMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_FTMP1);
-                       M_SUFS(d, s1, s2);
+                       M_FSUB(s1, s2, d);
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -967,7 +926,7 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
                        s2 = emit_load_s2(jd, iptr, REG_FTMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_FTMP1);
-                       M_MUFS(d, s1, s2);
+                       M_FMUL(s1, s2, d);
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -975,13 +934,14 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
                        s2 = emit_load_s2(jd, iptr, REG_FTMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_FTMP1);
-                       M_DVFS(d, s1, s2);
+                       M_FDIV(s1, s2, d);
                        emit_store_dst(jd, iptr, d);
                        break;
 
                /* ATTENTION: Java does not want IEEE behaviour in FREM, do
                   not use this */
 
+#if 0
                case ICMD_FREM:       /* ..., val1, val2  ==> ..., val1 % val2        */
 
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
@@ -990,12 +950,13 @@ bool codegen(jitdata *jd)
                        M_RMFS(d, s1, s2);
                        emit_store_dst(jd, iptr, d);
                        break;
+#endif
 
                case ICMD_DNEG:       /* ..., value  ==> ..., - value                 */
 
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
                        d = codegen_reg_of_dst(jd, iptr, REG_FTMP1);
-                       M_MNFD(d, s1);
+                       M_DNEG(s1, d);
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -1004,7 +965,7 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
                        s2 = emit_load_s2(jd, iptr, REG_FTMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_FTMP1);
-                       M_ADFD(d, s1, s2);
+                       M_DADD(s1, s2, d);
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -1013,7 +974,7 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
                        s2 = emit_load_s2(jd, iptr, REG_FTMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_FTMP1);
-                       M_SUFD(d, s1, s2);
+                       M_DSUB(s1, s2, d);
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -1022,7 +983,7 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
                        s2 = emit_load_s2(jd, iptr, REG_FTMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_FTMP1);
-                       M_MUFD(d, s1, s2);
+                       M_DMUL(s1, s2, d);
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -1031,13 +992,14 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
                        s2 = emit_load_s2(jd, iptr, REG_FTMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_FTMP1);
-                       M_DVFD(d, s1, s2);
+                       M_DDIV(s1, s2, d);
                        emit_store_dst(jd, iptr, d);
                        break;
 
                /* ATTENTION: Java does not want IEEE behaviour in DREM, do
                   not use this */
 
+#if 0
                case ICMD_DREM:       /* ..., val1, val2  ==> ..., val1 % val2        */
 
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
@@ -1046,12 +1008,13 @@ bool codegen(jitdata *jd)
                        M_RMFD(d, s1, s2);
                        emit_store_dst(jd, iptr, d);
                        break;
+#endif
 
                case ICMD_I2F:       /* ..., value  ==> ..., (float) value            */
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        d = codegen_reg_of_dst(jd, iptr, REG_FTMP1);
-                       M_FLTS(d, s1);
+                       M_CVTIF(s1, d);
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -1059,7 +1022,7 @@ bool codegen(jitdata *jd)
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        d = codegen_reg_of_dst(jd, iptr, REG_FTMP1);
-                       M_FLTD(d, s1);
+                       M_CVTID(s1, d);
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -1068,10 +1031,12 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
                        /* this uses round towards zero, as Java likes it */
-                       M_FIX(d, s1);
+                       M_CVTFI(s1, d);
+#if !defined(__VFP_FP__)
                        /* this checks for NaN; to return zero as Java likes it */
-                       M_CMF(s1, 0x8);
-                       M_MOVVS_IMM(d, 0);
+                       M_FCMP(s1, 0x8);
+                       M_MOVVS_IMM(0, d);
+#endif
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -1080,10 +1045,12 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
                        /* this uses round towards zero, as Java likes it */
-                       M_FIX(d, s1);
+                       M_CVTDI(s1, d);
+#if !defined(__VFP_FP__)
                        /* this checks for NaN; to return zero as Java likes it */
-                       M_CMF(s1, 0x8);
-                       M_MOVVS_IMM(d, 0);
+                       M_DCMP(s1, 0x8);
+                       M_MOVVS_IMM(0, d);
+#endif
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -1091,7 +1058,7 @@ bool codegen(jitdata *jd)
 
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
                        d = codegen_reg_of_dst(jd, iptr, REG_FTMP2);
-                       M_MVFS(d,s1);
+                       M_CVTDF(s1, d);
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -1099,7 +1066,7 @@ bool codegen(jitdata *jd)
 
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
                        d = codegen_reg_of_dst(jd, iptr, REG_FTMP2);
-                       M_MVFD(d,s1);
+                       M_CVTFD(s1, d);
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -1108,8 +1075,11 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
                        s2 = emit_load_s2(jd, iptr, REG_FTMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
-                       M_CMF(s2, s1);
+                       M_FCMP(s2, s1);
                        M_MOV_IMM(d, 0);
+#if defined(__VFP_FP__)
+                       M_FMSTAT; /* on VFP we need to transfer the flags */
+#endif
                        M_SUBGT_IMM(d, d, 1);
                        M_ADDLT_IMM(d, d, 1);
                        emit_store_dst(jd, iptr, d);
@@ -1120,8 +1090,11 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
                        s2 = emit_load_s2(jd, iptr, REG_FTMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
-                       M_CMF(s2, s1);
+                       M_DCMP(s2, s1);
                        M_MOV_IMM(d, 0);
+#if defined(__VFP_FP__)
+                       M_FMSTAT; /* on VFP we need to transfer the flags */
+#endif
                        M_SUBGT_IMM(d, d, 1);
                        M_ADDLT_IMM(d, d, 1);
                        emit_store_dst(jd, iptr, d);
@@ -1132,8 +1105,11 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
                        s2 = emit_load_s2(jd, iptr, REG_FTMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
-                       M_CMF(s1, s2);
+                       M_FCMP(s1, s2);
                        M_MOV_IMM(d, 0);
+#if defined(__VFP_FP__)
+                       M_FMSTAT; /* on VFP we need to transfer the flags */
+#endif
                        M_SUBLT_IMM(d, d, 1);
                        M_ADDGT_IMM(d, d, 1);
                        emit_store_dst(jd, iptr, d);
@@ -1144,8 +1120,11 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
                        s2 = emit_load_s2(jd, iptr, REG_FTMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
-                       M_CMF(s1, s2);
+                       M_DCMP(s1, s2);
                        M_MOV_IMM(d, 0);
+#if defined(__VFP_FP__)
+                       M_FMSTAT; /* on VFP we need to transfer the flags */
+#endif
                        M_SUBLT_IMM(d, d, 1);
                        M_ADDGT_IMM(d, d, 1);
                        emit_store_dst(jd, iptr, d);
@@ -1160,78 +1139,56 @@ bool codegen(jitdata *jd)
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP2);
-                       gen_nullptr_check(s1);
-                       M_ILD_INTERN(d, s1, OFFSET(java_arrayheader, size));
-                       emit_store_dst(jd, iptr, d);
-                       break;
-
-               case ICMD_AALOAD:     /* ..., arrayref, index  ==> ..., value         */
-
-                       s1 = emit_load_s1(jd, iptr, REG_ITMP1);
-                       s2 = emit_load_s2(jd, iptr, REG_ITMP2);
-                       d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
-                       if (INSTRUCTION_MUST_CHECK(iptr)) {
-                               gen_nullptr_check(s1);
-                               gen_bound_check(s1, s2);
-                       }
-                       M_ADD(REG_ITMP1, s1, REG_LSL(s2, 2)); /* REG_ITMP1 = s1 + 4 * s2 */
-                       M_LDR_INTERN(d, REG_ITMP1, OFFSET(java_objectarray, data[0]));
+                       /* implicit null-pointer check */
+                       M_ILD_INTERN(d, s1, OFFSET(java_array_t, size));
                        emit_store_dst(jd, iptr, d);
                        break;
 
-               case ICMD_IALOAD:     /* ..., arrayref, index  ==> ..., value         */
+               case ICMD_BALOAD:     /* ..., arrayref, index  ==> ..., value         */
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
-                       if (INSTRUCTION_MUST_CHECK(iptr)) {
-                               gen_nullptr_check(s1);
-                               gen_bound_check(s1, s2);
-                       }
-                       M_ADD(REG_ITMP1, s1, REG_LSL(s2, 2)); /* REG_ITMP1 = s1 + 4 * s2 */
-                       M_ILD_INTERN(d, REG_ITMP1, OFFSET(java_intarray, data[0]));
+                       /* implicit null-pointer check */
+                       emit_arrayindexoutofbounds_check(cd, iptr, s1, s2);
+                       M_ADD(REG_ITMP1, s1, s2); /* REG_ITMP1 = s1 + 1 * s2 */
+                       M_LDRSB(d, REG_ITMP1, OFFSET(java_bytearray_t, data[0]));
                        emit_store_dst(jd, iptr, d);
                        break;
 
-               case ICMD_BALOAD:     /* ..., arrayref, index  ==> ..., value         */
+               case ICMD_CALOAD:     /* ..., arrayref, index  ==> ..., value         */
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
-                       if (INSTRUCTION_MUST_CHECK(iptr)) {
-                               gen_nullptr_check(s1);
-                               gen_bound_check(s1, s2);
-                       }
-                       M_ADD(REG_ITMP1, s1, s2); /* REG_ITMP1 = s1 + 1 * s2 */
-                       M_LDRSB(d, REG_ITMP1, OFFSET(java_bytearray, data[0]));
+                       /* implicit null-pointer check */
+                       emit_arrayindexoutofbounds_check(cd, iptr, s1, s2);
+                       M_ADD(REG_ITMP1, s1, REG_LSL(s2, 1)); /* REG_ITMP1 = s1 + 2 * s2 */
+                       M_LDRH(d, REG_ITMP1, OFFSET(java_chararray_t, data[0]));
                        emit_store_dst(jd, iptr, d);
                        break;
 
-               case ICMD_CALOAD:     /* ..., arrayref, index  ==> ..., value         */
+               case ICMD_SALOAD:     /* ..., arrayref, index  ==> ..., value         */
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
-                       if (INSTRUCTION_MUST_CHECK(iptr)) {
-                               gen_nullptr_check(s1);
-                               gen_bound_check(s1, s2);
-                       }
+                       /* implicit null-pointer check */
+                       emit_arrayindexoutofbounds_check(cd, iptr, s1, s2);
                        M_ADD(REG_ITMP1, s1, REG_LSL(s2, 1)); /* REG_ITMP1 = s1 + 2 * s2 */
-                       M_LDRH(d, REG_ITMP1, OFFSET(java_chararray, data[0]));
+                       M_LDRSH(d, REG_ITMP1, OFFSET(java_shortarray_t, data[0]));
                        emit_store_dst(jd, iptr, d);
                        break;
 
-               case ICMD_SALOAD:     /* ..., arrayref, index  ==> ..., value         */
+               case ICMD_IALOAD:     /* ..., arrayref, index  ==> ..., value         */
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
-                       if (INSTRUCTION_MUST_CHECK(iptr)) {
-                               gen_nullptr_check(s1);
-                               gen_bound_check(s1, s2);
-                       }
-                       M_ADD(REG_ITMP1, s1, REG_LSL(s2, 1)); /* REG_ITMP1 = s1 + 2 * s2 */
-                       M_LDRSH(d, REG_ITMP1, OFFSET(java_shortarray, data[0]));
+                       /* implicit null-pointer check */
+                       emit_arrayindexoutofbounds_check(cd, iptr, s1, s2);
+                       M_ADD(REG_ITMP1, s1, REG_LSL(s2, 2)); /* REG_ITMP1 = s1 + 4 * s2 */
+                       M_ILD_INTERN(d, REG_ITMP1, OFFSET(java_intarray_t, data[0]));
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -1240,12 +1197,10 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP12_PACKED);
-                       if (INSTRUCTION_MUST_CHECK(iptr)) {
-                               gen_nullptr_check(s1);
-                               gen_bound_check(s1, s2);
-                       }
+                       /* implicit null-pointer check */
+                       emit_arrayindexoutofbounds_check(cd, iptr, s1, s2);
                        M_ADD(REG_ITMP3, s1, REG_LSL(s2, 3)); /* REG_ITMP3 = s1 + 8 * s2 */
-                       M_LLD_INTERN(d, REG_ITMP3, OFFSET(java_longarray, data[0]));
+                       M_LLD_INTERN(d, REG_ITMP3, OFFSET(java_longarray_t, data[0]));
                        emit_store_dst(jd, iptr, d);
                        break;
 
@@ -1253,17 +1208,15 @@ bool codegen(jitdata *jd)
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
-                       if (INSTRUCTION_MUST_CHECK(iptr)) {
-                               gen_nullptr_check(s1);
-                               gen_bound_check(s1, s2);
-                       }
+                       /* implicit null-pointer check */
+                       emit_arrayindexoutofbounds_check(cd, iptr, s1, s2);
                        M_ADD(REG_ITMP1, s1, REG_LSL(s2, 2)); /* REG_ITMP1 = s1 + 4 * s2 */
 #if !defined(ENABLE_SOFTFLOAT)
                        d = codegen_reg_of_dst(jd, iptr, REG_FTMP1);
-                       M_FLD_INTERN(d, REG_ITMP1, OFFSET(java_floatarray, data[0]));
+                       M_FLD_INTERN(d, REG_ITMP1, OFFSET(java_floatarray_t, data[0]));
 #else
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
-                       M_ILD_INTERN(d, REG_ITMP1, OFFSET(java_floatarray, data[0]));
+                       M_ILD_INTERN(d, REG_ITMP1, OFFSET(java_floatarray_t, data[0]));
 #endif
                        emit_store_dst(jd, iptr, d);
                        break;
@@ -1272,136 +1225,99 @@ bool codegen(jitdata *jd)
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
-                       if (INSTRUCTION_MUST_CHECK(iptr)) {
-                               gen_nullptr_check(s1);
-                               gen_bound_check(s1, s2);
-                       }
+                       /* implicit null-pointer check */
+                       emit_arrayindexoutofbounds_check(cd, iptr, s1, s2);
                        M_ADD(REG_ITMP3, s1, REG_LSL(s2, 3)); /* REG_ITMP3 = s1 + 8 * s2 */
 #if !defined(ENABLE_SOFTFLOAT)
                        d = codegen_reg_of_dst(jd, iptr, REG_FTMP1);
-                       M_DLD_INTERN(d, REG_ITMP3, OFFSET(java_doublearray, data[0]));
+                       M_DLD_INTERN(d, REG_ITMP3, OFFSET(java_doublearray_t, data[0]));
 #else
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP12_PACKED);
-                       M_LLD_INTERN(d, REG_ITMP3, OFFSET(java_doublearray, data[0]));
+                       M_LLD_INTERN(d, REG_ITMP3, OFFSET(java_doublearray_t, data[0]));
 #endif
                        emit_store_dst(jd, iptr, d);
                        break;
 
-               case ICMD_AASTORE:    /* ..., arrayref, index, value  ==> ...         */
-
-                       s1 = emit_load_s1(jd, iptr, REG_A0);
-                       s2 = emit_load_s2(jd, iptr, REG_ITMP1);
-                       if (INSTRUCTION_MUST_CHECK(iptr)) {
-                               gen_nullptr_check(s1);
-                               gen_bound_check(s1, s2);
-                       }
-                       s3 = emit_load_s3(jd, iptr, REG_A1);
-
-                       /* move arguments to argument registers */
-                       M_INTMOVE(s1, REG_A0);
-                       M_INTMOVE(s3, REG_A1);
-
-                       /* call builtin function */
-                       disp = dseg_add_functionptr(cd, BUILTIN_canstore);
-                       M_DSEG_BRANCH(disp);
-
-                       /* recompute pv */
-                       s1 = (s4) (cd->mcodeptr - cd->mcodebase);
-                       M_RECOMPUTE_PV(s1);
-
-                       /* check resturn value of builtin */
-                       M_TST(REG_RESULT, REG_RESULT);
-                       M_BEQ(0);
-                       codegen_add_arraystoreexception_ref(cd);
+               case ICMD_AALOAD:     /* ..., arrayref, index  ==> ..., value         */
 
-                       /* finally store address into array */
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
-                       s3 = emit_load_s3(jd, iptr, REG_ITMP3);
+                       d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
+                       /* implicit null-pointer check */
+                       emit_arrayindexoutofbounds_check(cd, iptr, s1, s2);
                        M_ADD(REG_ITMP1, s1, REG_LSL(s2, 2)); /* REG_ITMP1 = s1 + 4 * s2 */
-                       M_STR_INTERN(s3, REG_ITMP1, OFFSET(java_objectarray, data[0]));
+                       M_LDR_INTERN(d, REG_ITMP1, OFFSET(java_objectarray_t, data[0]));
+                       emit_store_dst(jd, iptr, d);
                        break;
 
-               case ICMD_IASTORE:    /* ..., arrayref, index, value  ==> ...         */
+               case ICMD_BASTORE:    /* ..., arrayref, index, value  ==> ...         */
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
-                       if (INSTRUCTION_MUST_CHECK(iptr)) {
-                               gen_nullptr_check(s1);
-                               gen_bound_check(s1, s2);
-                       }
+                       /* implicit null-pointer check */
+                       emit_arrayindexoutofbounds_check(cd, iptr, s1, s2);
                        s3 = emit_load_s3(jd, iptr, REG_ITMP3);
-                       M_ADD(REG_ITMP1, s1, REG_LSL(s2, 2)); /* REG_ITMP1 = s1 + 4 * s2 */
-                       M_IST_INTERN(s3, REG_ITMP1, OFFSET(java_intarray, data[0]));
+                       M_ADD(REG_ITMP1, s1, s2); /* REG_ITMP1 = s1 + 1 * s2 */
+                       M_STRB(s3, REG_ITMP1, OFFSET(java_bytearray_t, data[0]));
                        break;
 
-               case ICMD_BASTORE:    /* ..., arrayref, index, value  ==> ...         */
+               case ICMD_CASTORE:    /* ..., arrayref, index, value  ==> ...         */
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
-                       if (INSTRUCTION_MUST_CHECK(iptr)) {
-                               gen_nullptr_check(s1);
-                               gen_bound_check(s1, s2);
-                       }
+                       /* implicit null-pointer check */
+                       emit_arrayindexoutofbounds_check(cd, iptr, s1, s2);
                        s3 = emit_load_s3(jd, iptr, REG_ITMP3);
-                       M_ADD(REG_ITMP1, s1, s2); /* REG_ITMP1 = s1 + 1 * s2 */
-                       M_STRB(s3, REG_ITMP1, OFFSET(java_bytearray, data[0]));
+                       M_ADD(REG_ITMP1, s1, REG_LSL(s2, 1)); /* REG_ITMP1 = s1 + 2 * s2 */
+                       M_STRH(s3, REG_ITMP1, OFFSET(java_chararray_t, data[0]));
                        break;
 
-               case ICMD_CASTORE:    /* ..., arrayref, index, value  ==> ...         */
+               case ICMD_SASTORE:    /* ..., arrayref, index, value  ==> ...         */
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
-                       if (INSTRUCTION_MUST_CHECK(iptr)) {
-                               gen_nullptr_check(s1);
-                               gen_bound_check(s1, s2);
-                       }
+                       /* implicit null-pointer check */
+                       emit_arrayindexoutofbounds_check(cd, iptr, s1, s2);
                        s3 = emit_load_s3(jd, iptr, REG_ITMP3);
                        M_ADD(REG_ITMP1, s1, REG_LSL(s2, 1)); /* REG_ITMP1 = s1 + 2 * s2 */
-                       M_STRH(s3, REG_ITMP1, OFFSET(java_chararray, data[0]));
+                       M_STRH(s3, REG_ITMP1, OFFSET(java_shortarray_t, data[0]));
                        break;
 
-               case ICMD_SASTORE:    /* ..., arrayref, index, value  ==> ...         */
+               case ICMD_IASTORE:    /* ..., arrayref, index, value  ==> ...         */
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
-                       if (INSTRUCTION_MUST_CHECK(iptr)) {
-                               gen_nullptr_check(s1);
-                               gen_bound_check(s1, s2);
-                       }
+                       /* implicit null-pointer check */
+                       emit_arrayindexoutofbounds_check(cd, iptr, s1, s2);
                        s3 = emit_load_s3(jd, iptr, REG_ITMP3);
-                       M_ADD(REG_ITMP1, s1, REG_LSL(s2, 1)); /* REG_ITMP1 = s1 + 2 * s2 */
-                       M_STRH(s3, REG_ITMP1, OFFSET(java_shortarray, data[0]));
+                       M_ADD(REG_ITMP1, s1, REG_LSL(s2, 2)); /* REG_ITMP1 = s1 + 4 * s2 */
+                       M_IST_INTERN(s3, REG_ITMP1, OFFSET(java_intarray_t, data[0]));
                        break;
 
                case ICMD_LASTORE:    /* ..., arrayref, index, value  ==> ...         */
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
-                       if (INSTRUCTION_MUST_CHECK(iptr)) {
-                               gen_nullptr_check(s1);
-                               gen_bound_check(s1, s2);
-                       }
+                       /* implicit null-pointer check */
+                       emit_arrayindexoutofbounds_check(cd, iptr, s1, s2);
                        M_ADD(REG_ITMP3, s1, REG_LSL(s2, 3)); /* REG_ITMP3 = s1 + 8 * s2 */
                        s3 = emit_load_s3(jd, iptr, REG_ITMP12_PACKED);
-                       M_LST_INTERN(s3, REG_ITMP3, OFFSET(java_longarray, data[0]));
+                       M_LST_INTERN(s3, REG_ITMP3, OFFSET(java_longarray_t, data[0]));
                        break;
 
                case ICMD_FASTORE:    /* ..., arrayref, index, value  ==> ...         */
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
-                       if (INSTRUCTION_MUST_CHECK(iptr)) {
-                               gen_nullptr_check(s1);
-                               gen_bound_check(s1, s2);
-                       }
+                       /* implicit null-pointer check */
+                       emit_arrayindexoutofbounds_check(cd, iptr, s1, s2);
                        M_ADD(REG_ITMP1, s1, REG_LSL(s2, 2)); /* REG_ITMP1 = s1 + 4 * s2 */
 #if !defined(ENABLE_SOFTFLOAT)
                        s3 = emit_load_s3(jd, iptr, REG_FTMP1);
-                       M_FST_INTERN(s3, REG_ITMP1, OFFSET(java_floatarray, data[0]));
+                       M_FST_INTERN(s3, REG_ITMP1, OFFSET(java_floatarray_t, data[0]));
 #else
                        s3 = emit_load_s3(jd, iptr, REG_ITMP3);
-                       M_IST_INTERN(s3, REG_ITMP1, OFFSET(java_floatarray, data[0]));
+                       M_IST_INTERN(s3, REG_ITMP1, OFFSET(java_floatarray_t, data[0]));
 #endif
                        break;
 
@@ -1409,47 +1325,68 @@ bool codegen(jitdata *jd)
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2(jd, iptr, REG_ITMP2);
-                       if (INSTRUCTION_MUST_CHECK(iptr)) {
-                               gen_nullptr_check(s1);
-                               gen_bound_check(s1, s2);
-                       }
+                       /* implicit null-pointer check */
+                       emit_arrayindexoutofbounds_check(cd, iptr, s1, s2);
                        M_ADD(REG_ITMP1, s1, REG_LSL(s2, 3)); /* REG_ITMP1 = s1 + 8 * s2 */
 #if !defined(ENABLE_SOFTFLOAT)
                        s3 = emit_load_s3(jd, iptr, REG_FTMP1);
-                       M_DST_INTERN(s3, REG_ITMP1, OFFSET(java_doublearray, data[0]));
+                       M_DST_INTERN(s3, REG_ITMP1, OFFSET(java_doublearray_t, data[0]));
 #else
                        s3 = emit_load_s3(jd, iptr, REG_ITMP23_PACKED);
-                       M_LST_INTERN(s3, REG_ITMP1, OFFSET(java_doublearray, data[0]));
+                       M_LST_INTERN(s3, REG_ITMP1, OFFSET(java_doublearray_t, data[0]));
 #endif
                        break;
 
-               case ICMD_GETSTATIC:  /* ...  ==> ..., value                          */
+               case ICMD_AASTORE:    /* ..., arrayref, index, value  ==> ...         */
 
-                       if (INSTRUCTION_IS_UNRESOLVED(iptr)) {
-                               unresolved_field *uf = iptr->sx.s23.s3.uf;
+                       s1 = emit_load_s1(jd, iptr, REG_A0);
+                       s2 = emit_load_s2(jd, iptr, REG_ITMP1);
+                       s3 = emit_load_s3(jd, iptr, REG_A1);
 
-                               fieldtype = uf->fieldref->parseddesc.fd->type;
+                       /* implicit null-pointer check */
+                       emit_arrayindexoutofbounds_check(cd, iptr, s1, s2);
 
-                               disp = dseg_add_unique_address(cd, NULL);
+                       /* move arguments to argument registers */
+                       M_INTMOVE(s1, REG_A0);
+                       M_INTMOVE(s3, REG_A1);
+
+                       /* call builtin function */
+                       disp = dseg_add_functionptr(cd, BUILTIN_FAST_canstore);
+                       M_DSEG_BRANCH(disp);
+
+                       /* recompute pv */
+                       s1 = (s4) (cd->mcodeptr - cd->mcodebase);
+                       M_RECOMPUTE_PV(s1);
+
+                       /* check return value of builtin */
+                       emit_arraystore_check(cd, iptr);
+
+                       /* finally store address into array */
+                       s1 = emit_load_s1(jd, iptr, REG_ITMP1);
+                       s2 = emit_load_s2(jd, iptr, REG_ITMP2);
+                       s3 = emit_load_s3(jd, iptr, REG_ITMP3);
+                       M_ADD(REG_ITMP1, s1, REG_LSL(s2, 2)); /* REG_ITMP1 = s1 + 4 * s2 */
+                       M_STR_INTERN(s3, REG_ITMP1, OFFSET(java_objectarray_t, data[0]));
+                       break;
+
+               case ICMD_GETSTATIC:  /* ...  ==> ..., value                          */
 
-                               codegen_addpatchref(cd, PATCHER_get_putstatic, uf, disp);
+                       if (INSTRUCTION_IS_UNRESOLVED(iptr)) {
+                               uf        = iptr->sx.s23.s3.uf;
+                               fieldtype = uf->fieldref->parseddesc.fd->type;
+                               disp      = dseg_add_unique_address(cd, NULL);
 
-                               if (opt_showdisassemble)
-                                       M_NOP;
+                               patcher_add_patch_ref(jd, PATCHER_get_putstatic, uf, disp);
                        }
                        else {
-                               fieldinfo *fi = iptr->sx.s23.s3.fmiref->p.field;
-
+                               fi        = iptr->sx.s23.s3.fmiref->p.field;
                                fieldtype = fi->type;
+                               disp      = dseg_add_address(cd, fi->value);
 
-                               if (!CLASS_IS_OR_ALMOST_INITIALIZED(fi->class)) {
-                                       codegen_addpatchref(cd, PATCHER_clinit, fi->class, 0);
-
-                                       if (opt_showdisassemble)
-                                               M_NOP;
+                               if (!CLASS_IS_OR_ALMOST_INITIALIZED(fi->clazz)) {
+                                       patcher_add_patch_ref(jd, PATCHER_initialize_class,
+                                                           fi->clazz, 0);
                                }
-
-                               disp = dseg_add_address(cd, &(fi->value));
                        }
 
                        M_DSEG_LOAD(REG_ITMP3, disp);
@@ -1488,30 +1425,21 @@ bool codegen(jitdata *jd)
                case ICMD_PUTSTATIC:  /* ..., value  ==> ...                          */
 
                        if (INSTRUCTION_IS_UNRESOLVED(iptr)) {
-                               unresolved_field *uf = iptr->sx.s23.s3.uf;
-
+                               uf        = iptr->sx.s23.s3.uf;
                                fieldtype = uf->fieldref->parseddesc.fd->type;
+                               disp      = dseg_add_unique_address(cd, NULL);
 
-                               disp = dseg_add_unique_address(cd, NULL);
-
-                               codegen_addpatchref(cd, PATCHER_get_putstatic, uf, disp);
-
-                               if (opt_showdisassemble)
-                                       M_NOP;
+                               patcher_add_patch_ref(jd, PATCHER_get_putstatic, uf, disp);
                        }
                        else {
-                               fieldinfo *fi = iptr->sx.s23.s3.fmiref->p.field;
-
+                               fi        = iptr->sx.s23.s3.fmiref->p.field;
                                fieldtype = fi->type;
+                               disp      = dseg_add_address(cd, fi->value);
 
-                               if (!CLASS_IS_OR_ALMOST_INITIALIZED(fi->class)) {
-                                       codegen_addpatchref(cd, PATCHER_clinit, fi->class, 0);
-
-                                       if (opt_showdisassemble)
-                                               M_NOP;
+                               if (!CLASS_IS_OR_ALMOST_INITIALIZED(fi->clazz)) {
+                                       patcher_add_patch_ref(jd, PATCHER_initialize_class,
+                                                           fi->clazz, 0);
                                }
-
-                               disp = dseg_add_address(cd, &(fi->value));
                        }
 
                        M_DSEG_LOAD(REG_ITMP3, disp);
@@ -1549,33 +1477,33 @@ bool codegen(jitdata *jd)
                case ICMD_GETFIELD:   /* ..., objectref, value  ==> ...               */
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP3);
-                       gen_nullptr_check(s1);
-#if !defined(ENABLE_SOFTFLOAT)
-                       /* HACK: softnull checks on floats */
-                       if (!checknull && IS_FLT_DBL_TYPE(fieldtype))
-                               gen_nullptr_check_intern(s1);
-#endif
+                       emit_nullpointer_check(cd, iptr, s1);
 
-                       if (INSTRUCTION_IS_UNRESOLVED(iptr)) {
-                               unresolved_field *uf = iptr->sx.s23.s3.uf;
 
+                       if (INSTRUCTION_IS_UNRESOLVED(iptr)) {
+                               uf        = iptr->sx.s23.s3.uf;
                                fieldtype = uf->fieldref->parseddesc.fd->type;
-
-                               codegen_addpatchref(cd, PATCHER_get_putfield,
-                                                                       iptr->sx.s23.s3.uf, 0);
-
-                               if (opt_showdisassemble)
-                                       M_NOP;
-
-                               disp = 0;
+                               disp      = 0;
                        }
                        else {
-                               fieldinfo *fi = iptr->sx.s23.s3.fmiref->p.field;
-
+                               fi        = iptr->sx.s23.s3.fmiref->p.field;
                                fieldtype = fi->type;
                                disp      = fi->offset;
                        }
 
+#if !defined(ENABLE_SOFTFLOAT)
+                       /* HACK: softnull checks on floats */
+                       if (!INSTRUCTION_MUST_CHECK(iptr) && IS_FLT_DBL_TYPE(fieldtype))
+                               emit_nullpointer_check_force(cd, iptr, s1);
+#endif
+
+                       if (INSTRUCTION_IS_UNRESOLVED(iptr)) {
+                               /* XXX REMOVE ME */
+                               uf = iptr->sx.s23.s3.uf;
+
+                               patcher_add_patch_ref(jd, PATCHER_get_putfield, uf, 0);
+                       }
+
                        switch (fieldtype) {
                        case TYPE_INT:
 #if defined(ENABLE_SOFTFLOAT)
@@ -1611,26 +1539,25 @@ bool codegen(jitdata *jd)
                case ICMD_PUTFIELD:   /* ..., objectref, value  ==> ...               */
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP3);
-                       gen_nullptr_check(s1);
-
-#if !defined(ENABLE_SOFTFLOAT)
-                       /* HACK: softnull checks on floats */
-                       if (!checknull && IS_FLT_DBL_TYPE(fieldtype))
-                               gen_nullptr_check_intern(s1);
-#endif
+                       emit_nullpointer_check(cd, iptr, s1);
 
                        if (INSTRUCTION_IS_UNRESOLVED(iptr)) {
-                               unresolved_field *uf = iptr->sx.s23.s3.uf;
-
+                               uf        = iptr->sx.s23.s3.uf;
                                fieldtype = uf->fieldref->parseddesc.fd->type;
+                               disp      = 0;
                        }
                        else {
-                               fieldinfo *fi = iptr->sx.s23.s3.fmiref->p.field;
-
+                               fi        = iptr->sx.s23.s3.fmiref->p.field;
                                fieldtype = fi->type;
                                disp      = fi->offset;
                        }
 
+#if !defined(ENABLE_SOFTFLOAT)
+                       /* HACK: softnull checks on floats */
+                       if (!INSTRUCTION_MUST_CHECK(iptr) && IS_FLT_DBL_TYPE(fieldtype))
+                               emit_nullpointer_check_force(cd, iptr, s1);
+#endif
+
                        switch (fieldtype) {
                        case TYPE_INT:
 #if defined(ENABLE_SOFTFLOAT)
@@ -1656,14 +1583,10 @@ bool codegen(jitdata *jd)
                        }
 
                        if (INSTRUCTION_IS_UNRESOLVED(iptr)) {
-                               unresolved_field *uf = iptr->sx.s23.s3.uf;
-
-                               codegen_addpatchref(cd, PATCHER_get_putfield, uf, 0);
+                               /* XXX REMOVE ME */
+                               uf = iptr->sx.s23.s3.uf;
 
-                               if (opt_showdisassemble)
-                                       M_NOP;
-
-                               disp = 0;
+                               patcher_add_patch_ref(jd, PATCHER_get_putfield, uf, 0);
                        }
 
                        switch (fieldtype) {
@@ -1701,11 +1624,8 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        M_INTMOVE(s1, REG_ITMP1_XPTR);
                        if (INSTRUCTION_IS_UNRESOLVED(iptr)) {
-                               codegen_addpatchref(cd, PATCHER_athrow_areturn,
+                               patcher_add_patch_ref(jd, PATCHER_resolve_class,
                                                                        iptr->sx.s23.s2.uc, 0);
-
-                               if (opt_showdisassemble)
-                                       M_NOP;
                        }
                        disp = dseg_add_functionptr(cd, asm_handle_exception);
                        M_DSEG_LOAD(REG_ITMP3, disp);
@@ -1718,30 +1638,20 @@ bool codegen(jitdata *jd)
                case ICMD_GOTO:         /* ... ==> ...                                */
                case ICMD_RET:
 
-                       M_B(0);
-                       codegen_addreference(cd, iptr->dst.block);
+                       emit_br(cd, iptr->dst.block);
                        break;
 
                case ICMD_JSR:          /* ... ==> ...                                */
 
-                       M_B(0);
-                       codegen_addreference(cd, iptr->sx.s23.s3.jsrtarget.block);
+                       emit_br(cd, iptr->sx.s23.s3.jsrtarget.block);
                        break;
                
                case ICMD_IFNULL:       /* ..., value ==> ...                         */
+               case ICMD_IFNONNULL:
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        M_TEQ_IMM(s1, 0);
-                       M_BEQ(0);
-                       codegen_addreference(cd, iptr->dst.block);
-                       break;
-
-               case ICMD_IFNONNULL:    /* ..., value ==> ...                         */
-
-                       s1 = emit_load_s1(jd, iptr, REG_ITMP1);
-                       M_TEQ_IMM(s1, 0);
-                       M_BNE(0);
-                       codegen_addreference(cd, iptr->dst.block);
+                       emit_bcc(cd, iptr->dst.block, iptr->opc - ICMD_IFNULL, BRANCH_OPT_NONE);
                        break;
 
                case ICMD_IFLT:         /* ..., value ==> ...                         */
@@ -1752,201 +1662,316 @@ bool codegen(jitdata *jd)
                case ICMD_IFNE:
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
-                       M_COMPARE(s1, iptr->sx.val.i, UNCOND, 0);
+                       M_COMPARE(s1, iptr->sx.val.i);
+                       emit_bcc(cd, iptr->dst.block, iptr->opc - ICMD_IFEQ, BRANCH_OPT_NONE);
+                       break;
 
-                       switch(iptr->opc) {
-                       case ICMD_IFLT:
-                               M_BLT(0);
-                               break;
-                       case ICMD_IFLE:
-                               M_BLE(0);
-                               break;
-                       case ICMD_IFGT:
-                               M_BGT(0);
-                               break;
-                       case ICMD_IFGE:
-                               M_BGE(0);
-                               break;
-                       case ICMD_IFEQ:
-                               M_BEQ(0);
-                               break;
-                       case ICMD_IFNE:
-                               M_BNE(0);
-                               break;
-                       default:
-                               assert(0);
+               case ICMD_IF_LEQ:       /* ..., value ==> ...                         */
+
+                       s1 = emit_load_s1_high(jd, iptr, REG_ITMP1);
+                       s2 = emit_load_s1_low(jd, iptr, REG_ITMP2);
+                       if (iptr->sx.val.l == 0) {
+                               M_ORR_S(s1, s2, REG_ITMP3);
                        }
-                       codegen_addreference(cd, iptr->dst.block);
+                       else {
+                               M_COMPARE(s1, (iptr->sx.val.l >> 32));
+                               /*ICONST(REG_ITMP3, iptr->sx.val.l >> 32);
+                               M_CMP(s1, REG_ITMP3);*/
+                               ICONST(REG_ITMP3, iptr->sx.val.l & 0xffffffff);
+                               M_CMPEQ(s2, REG_ITMP3);
+                       }
+                       emit_beq(cd, iptr->dst.block);
                        break;
 
                case ICMD_IF_LLT:       /* ..., value ==> ...                         */
-               case ICMD_IF_LLE:       /* op1 = target JavaVM pc, val.l = constant   */
-               case ICMD_IF_LGT:
-               case ICMD_IF_LGE:
-               case ICMD_IF_LEQ:
-               case ICMD_IF_LNE:
 
-                       /* ATTENTION: compare high words signed and low words unsigned */
+                       s1 = emit_load_s1_high(jd, iptr, REG_ITMP1);
+                       s2 = emit_load_s1_low(jd, iptr, REG_ITMP2);
+                       if (iptr->sx.val.l == 0) {
+                               /* if high word is less than zero, the whole long is too */
+                               M_CMP_IMM(s1, 0);
+                               emit_blt(cd, iptr->dst.block);
+                       }
+                       else {
+                               /* high compare: x=0(ifLT) ; x=1(ifEQ) ; x=2(ifGT) */
+                               M_COMPARE(s1, (iptr->sx.val.l >> 32));
+                               /*ICONST(REG_ITMP3, iptr->sx.val.l >> 32);
+                               M_CMP(s1, REG_ITMP3);*/
+                               M_EOR(REG_ITMP1, REG_ITMP1, REG_ITMP1);
+                               M_MOVGT_IMM(2, REG_ITMP1);
+                               M_MOVEQ_IMM(1, REG_ITMP1);
+
+                               /* low compare: x=x-1(ifLO) */
+                               M_COMPARE(s2, (iptr->sx.val.l & 0xffffffff));
+                               /*ICONST(REG_ITMP3, iptr->sx.val.l & 0xffffffff);
+                               M_CMP(s2, REG_ITMP3);*/
+                               M_SUBLO_IMM(REG_ITMP1, REG_ITMP1, 1);
+
+                               /* branch if (x LT 1) */
+                               M_CMP_IMM(REG_ITMP1, 1);
+                               emit_blt(cd, iptr->dst.block);
+                       }
+                       break;
+
+               case ICMD_IF_LLE:       /* ..., value ==> ...                         */
 
                        s1 = emit_load_s1_high(jd, iptr, REG_ITMP1);
-                       M_COMPARE(s1, (iptr->sx.val.l >> 32), UNCOND, 0);
+                       s2 = emit_load_s1_low(jd, iptr, REG_ITMP2);
+                       if (iptr->sx.val.l == 0) {
+                               /* if high word is less than zero, the whole long is too  */
+                               M_CMP_IMM(s1, 0);
+                               emit_blt(cd, iptr->dst.block);
 
-                       switch(iptr->opc) {
-                       case ICMD_IF_LLT:
-                       case ICMD_IF_LLE:
-                               M_BLT(0);
-                               codegen_addreference(cd, iptr->dst.block);
-                               break;
-                       case ICMD_IF_LGT:
-                       case ICMD_IF_LGE:
-                               M_BGT(0);
-                               codegen_addreference(cd, iptr->dst.block);
-                               break;
-                       case ICMD_IF_LEQ: /* EQ and NE are the same for unsigned */
-                       case ICMD_IF_LNE:
-                               break;
-                       default:
-                               assert(0);
+                               /* ... otherwise the low word has to be zero (tricky!) */
+                               M_CMPEQ_IMM(s2, 0);
+                               emit_beq(cd, iptr->dst.block);
                        }
+                       else {
+                               /* high compare: x=0(ifLT) ; x=1(ifEQ) ; x=2(ifGT) */
+                               M_COMPARE(s1, (iptr->sx.val.l >> 32));
+                               /*ICONST(REG_ITMP3, iptr->sx.val.l >> 32);
+                               M_CMP(s1, REG_ITMP3);*/
+                               M_EOR(REG_ITMP1, REG_ITMP1, REG_ITMP1);
+                               M_MOVGT_IMM(2, REG_ITMP1);
+                               M_MOVEQ_IMM(1, REG_ITMP1);
 
-                       s1 = emit_load_s1_low(jd, iptr, REG_ITMP1);
+                               /* low compare: x=x+1(ifHI) */
+                               M_COMPARE(s2, (iptr->sx.val.l & 0xffffffff));
+                               /*ICONST(REG_ITMP3, iptr->sx.val.l & 0xffffffff);
+                               M_CMP(s2, REG_ITMP3);*/
+                               M_ADDHI_IMM(REG_ITMP1, REG_ITMP1, 1);
 
-                       switch(iptr->opc) {
-                       case ICMD_IF_LLT:
-                               M_COMPARE(s1, (iptr->sx.val.l & 0xffffffff), COND_EQ, 1);
-                               M_BLO(0);
-                               break;
-                       case ICMD_IF_LLE:
-                               M_COMPARE(s1, (iptr->sx.val.l & 0xffffffff), COND_EQ, 1);
-                               M_BLS(0);
-                               break;
-                       case ICMD_IF_LGT:
-                               M_COMPARE(s1, (iptr->sx.val.l & 0xffffffff), COND_EQ, 1);
-                               M_BHI(0);
-                               break;
-                       case ICMD_IF_LGE:
-                               M_COMPARE(s1, (iptr->sx.val.l & 0xffffffff), COND_EQ, 1);
-                               M_BHS(0);
-                               break;
-                       case ICMD_IF_LEQ:
-                               M_COMPARE(s1, (iptr->sx.val.l & 0xffffffff), COND_EQ, 0);
-                               M_BEQ(0);
-                               break;
-                       case ICMD_IF_LNE:
-                               M_COMPARE(s1, (iptr->sx.val.l & 0xffffffff), COND_EQ, 0);
-                               M_BNE(0);
-                               break;
-                       default:
-                               assert(0);
+                               /* branch if (x LE 1) */
+                               M_CMP_IMM(REG_ITMP1, 1);
+                               emit_ble(cd, iptr->dst.block);
                        }
-                       codegen_addreference(cd, iptr->dst.block);
                        break;
 
-               case ICMD_IF_ICMPEQ:    /* ..., value, value ==> ...                  */
-               case ICMD_IF_ACMPEQ:    /* op1 = target JavaVM pc                     */
-               case ICMD_IF_ICMPNE:
-               case ICMD_IF_ACMPNE:
-               case ICMD_IF_ICMPLT:
-               case ICMD_IF_ICMPLE:
-               case ICMD_IF_ICMPGT:
-               case ICMD_IF_ICMPGE:
+               case ICMD_IF_LGE:       /* ..., value ==> ...                         */
 
-                       s1 = emit_load_s1(jd, iptr, REG_ITMP1);
-                       s2 = emit_load_s2(jd, iptr, REG_ITMP2);
-                       M_CMP(s1, s2);
-                       switch(iptr->opc) {
-                       case ICMD_IF_ICMPLT:
-                               M_BLT(0);
-                               break;
-                       case ICMD_IF_ICMPLE:
-                               M_BLE(0);
-                               break;
-                       case ICMD_IF_ICMPGT:
+                       s1 = emit_load_s1_high(jd, iptr, REG_ITMP1);
+                       s2 = emit_load_s1_low(jd, iptr, REG_ITMP2);
+                       if (iptr->sx.val.l == 0) {
+                               /* if high word is greater or equal zero, the whole long is too */
+                               M_CMP_IMM(s1, 0);
+                               emit_bge(cd, iptr->dst.block);
+                       }
+                       else {
+                               /* high compare: x=0(ifLT) ; x=1(ifEQ) ; x=2(ifGT) */
+                               M_COMPARE(s1, (iptr->sx.val.l >> 32));
+                               /*ICONST(REG_ITMP3, iptr->sx.val.l >> 32);
+                               M_CMP(s1, REG_ITMP3);*/
+                               M_EOR(REG_ITMP1, REG_ITMP1, REG_ITMP1);
+                               M_MOVGT_IMM(2, REG_ITMP1);
+                               M_MOVEQ_IMM(1, REG_ITMP1);
+
+                               /* low compare: x=x-1(ifLO) */
+                               M_COMPARE(s2, (iptr->sx.val.l & 0xffffffff));
+                               /*ICONST(REG_ITMP3, iptr->sx.val.l & 0xffffffff);
+                               M_CMP(s2, REG_ITMP3);*/
+                               M_SUBLO_IMM(REG_ITMP1, REG_ITMP1, 1);
+
+                               /* branch if (x GE 1) */
+                               M_CMP_IMM(REG_ITMP1, 1);
+                               emit_bge(cd, iptr->dst.block);
+                       }
+                       break;
+
+               case ICMD_IF_LGT:       /* ..., value ==> ...                         */
+
+                       s1 = emit_load_s1_high(jd, iptr, REG_ITMP1);
+                       s2 = emit_load_s1_low(jd, iptr, REG_ITMP2);
+#if 0
+                       if (iptr->sx.val.l == 0) {
+                               /* if high word is greater than zero, the whole long is too */
+                               M_CMP_IMM(s1, 0);
                                M_BGT(0);
-                               break;
-                       case ICMD_IF_ICMPGE:
-                               M_BGE(0);
-                               break;
-                       case ICMD_IF_ICMPEQ:
-                       case ICMD_IF_ACMPEQ:
-                               M_BEQ(0);
-                               break;
-                       case ICMD_IF_ICMPNE:
-                       case ICMD_IF_ACMPNE:
+                               codegen_add_branch_ref(cd, iptr->dst.block);
+
+                               /* ... or high was zero and low is non zero (tricky!) */
+                               M_EOR(REG_ITMP3, REG_ITMP3, REG_ITMP3);
+                               M_MOVLT_IMM(1, REG_ITMP3);
+                               M_ORR_S(REG_ITMP3, s2, REG_ITMP3);
                                M_BNE(0);
-                               break;
-                       default:
-                               assert(0);
+                               codegen_add_branch_ref(cd, iptr->dst.block);
                        }
-                       codegen_addreference(cd, iptr->dst.block);
+                       else {
+#endif
+                               /* high compare: x=0(ifLT) ; x=1(ifEQ) ; x=2(ifGT) */
+                               M_COMPARE(s1, (iptr->sx.val.l >> 32));
+                               /*ICONST(REG_ITMP3, iptr->sx.val.l >> 32);
+                               M_CMP(s1, REG_ITMP3);*/
+                               M_EOR(REG_ITMP1, REG_ITMP1, REG_ITMP1);
+                               M_MOVGT_IMM(2, REG_ITMP1);
+                               M_MOVEQ_IMM(1, REG_ITMP1);
+
+                               /* low compare: x=x+1(ifHI) */
+                               M_COMPARE(s2, (iptr->sx.val.l & 0xffffffff));
+                               /*ICONST(REG_ITMP3, iptr->sx.val.l & 0xffffffff);
+                               M_CMP(s2, REG_ITMP3);*/
+                               M_ADDHI_IMM(REG_ITMP1, REG_ITMP1, 1);
+
+                               /* branch if (x GT 1) */
+                               M_CMP_IMM(REG_ITMP1, 1);
+                               emit_bgt(cd, iptr->dst.block);
+#if 0
+                       }
+#endif
+                       break;
+
+               case ICMD_IF_LNE:       /* ..., value ==> ...                         */
+
+                       s1 = emit_load_s1_high(jd, iptr, REG_ITMP1);
+                       s2 = emit_load_s1_low(jd, iptr, REG_ITMP2);
+                       if (iptr->sx.val.l == 0) {
+                               M_ORR_S(s1, s2, REG_ITMP3);
+                       }
+                       else {
+                               M_COMPARE(s1, (iptr->sx.val.l >> 32));
+                               /*ICONST(REG_ITMP3, iptr->sx.val.l >> 32);
+                               M_CMP(s1, REG_ITMP3);*/
+                               ICONST(REG_ITMP3, iptr->sx.val.l & 0xffffffff);
+                               M_CMPEQ(s2, REG_ITMP3);
+                       }
+                       emit_bne(cd, iptr->dst.block);
+                       break;
+                       
+               case ICMD_IF_ICMPEQ:    /* ..., value, value ==> ...                  */
+               case ICMD_IF_ICMPNE:
+               case ICMD_IF_ICMPLT:
+               case ICMD_IF_ICMPLE:
+               case ICMD_IF_ICMPGT:
+               case ICMD_IF_ICMPGE:
+
+                       s1 = emit_load_s1(jd, iptr, REG_ITMP1);
+                       s2 = emit_load_s2(jd, iptr, REG_ITMP2);
+                       M_CMP(s1, s2);
+                       emit_bcc(cd, iptr->dst.block, iptr->opc - ICMD_IF_ICMPEQ, BRANCH_OPT_NONE);
+                       break;
+
+               case ICMD_IF_ACMPEQ:    /* ..., value, value ==> ...                  */
+               case ICMD_IF_ACMPNE:
+
+                       s1 = emit_load_s1(jd, iptr, REG_ITMP1);
+                       s2 = emit_load_s2(jd, iptr, REG_ITMP2);
+                       M_CMP(s1, s2);
+                       emit_bcc(cd, iptr->dst.block, iptr->opc - ICMD_IF_ACMPEQ, BRANCH_OPT_NONE);
                        break;
 
                case ICMD_IF_LCMPEQ:    /* ..., value, value ==> ...                  */
-               case ICMD_IF_LCMPNE:    /* op1 = target JavaVM pc                     */
-               case ICMD_IF_LCMPLT:
-               case ICMD_IF_LCMPLE:
-               case ICMD_IF_LCMPGT:
-               case ICMD_IF_LCMPGE:
+                                       /* op1 = target JavaVM pc                     */
 
-                       /* ATTENTION: compare high words signed and low words unsigned */
                        s1 = emit_load_s1_high(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2_high(jd, iptr, REG_ITMP2);
                        M_CMP(s1, s2);
 
-                       switch(iptr->opc) {
-                       case ICMD_IF_LCMPEQ: /* EQ and NE are the same for unsigned */
-                       case ICMD_IF_LCMPNE:
-                               break;
-                       case ICMD_IF_LCMPLT:
-                       case ICMD_IF_LCMPLE:
-                               M_BLT(0);
-                               codegen_addreference(cd, iptr->dst.block);
-                               break;
-                       case ICMD_IF_LCMPGT:
-                       case ICMD_IF_LCMPGE:
-                               M_BGT(0);
-                               codegen_addreference(cd, iptr->dst.block);
-                               break;
-                       default:
-                               assert(0);
-                       }
+                       s1 = emit_load_s1_low(jd, iptr, REG_ITMP1);
+                       s2 = emit_load_s2_low(jd, iptr, REG_ITMP2);
+                       M_CMPEQ(s1, s2);
+
+                       emit_beq(cd, iptr->dst.block);
+                       break;
+
+               case ICMD_IF_LCMPNE:    /* ..., value, value ==> ...                  */
+                                       /* op1 = target JavaVM pc                     */
+
+                       s1 = emit_load_s1_high(jd, iptr, REG_ITMP1);
+                       s2 = emit_load_s2_high(jd, iptr, REG_ITMP2);
+                       M_CMP(s1, s2);
 
                        s1 = emit_load_s1_low(jd, iptr, REG_ITMP1);
                        s2 = emit_load_s2_low(jd, iptr, REG_ITMP2);
+                       M_CMPEQ(s1, s2);
 
-                       switch(iptr->opc) {
-                       case ICMD_IF_LCMPEQ:
-                               M_DAT(COND_EQ,0x0a,0,s1,1,0,s2);
-                               M_BEQ(0);
-                               break;
-                       case ICMD_IF_LCMPNE:
-                               M_DAT(COND_EQ,0x0a,0,s1,1,0,s2);
-                               M_BNE(0);
-                               break;
-                       case ICMD_IF_LCMPLT:
-                               M_BNE(1);
-                               M_CMP(s1, s2);
-                               M_BLO(0);
-                               break;
-                       case ICMD_IF_LCMPLE:
-                               M_BNE(1);
-                               M_CMP(s1, s2);
-                               M_BLS(0);
-                               break;
-                       case ICMD_IF_LCMPGT:
-                               M_BNE(1);
-                               M_CMP(s1, s2);
-                               M_BHI(0);
-                               break;
-                       case ICMD_IF_LCMPGE:
-                               M_BNE(1);
-                               M_CMP(s1, s2);
-                               M_BHS(0);
-                               break;
-                       default:
-                               assert(0);
-                       }
-                       codegen_addreference(cd, iptr->dst.block);
+                       emit_bne(cd, iptr->dst.block);
+                       break;
+
+               case ICMD_IF_LCMPLT:    /* ..., value, value ==> ...                  */
+                                       /* op1 = target JavaVM pc                     */
+
+                       /* high compare: x=0(ifLT) ; x=1(ifEQ) ; x=2(ifGT) */
+                       s1 = emit_load_s1_high(jd, iptr, REG_ITMP1);
+                       s2 = emit_load_s2_high(jd, iptr, REG_ITMP2);
+                       M_CMP(s1, s2);
+                       M_EOR(REG_ITMP3, REG_ITMP3, REG_ITMP3);
+                       M_MOVGT_IMM(2, REG_ITMP3);
+                       M_MOVEQ_IMM(1, REG_ITMP3);
+
+                       /* low compare: x=x-1(ifLO) */
+                       s1 = emit_load_s1_low(jd, iptr, REG_ITMP1);
+                       s2 = emit_load_s2_low(jd, iptr, REG_ITMP2);
+                       M_CMP(s1, s2);
+                       M_SUBLO_IMM(REG_ITMP3, REG_ITMP3, 1);
+
+                       /* branch if (x LT 1) */
+                       M_CMP_IMM(REG_ITMP3, 1);
+                       emit_blt(cd, iptr->dst.block);
+                       break;
+
+               case ICMD_IF_LCMPLE:    /* ..., value, value ==> ...                  */
+                                       /* op1 = target JavaVM pc                     */
+
+                       /* high compare: x=0(ifLT) ; x=1(ifEQ) ; x=2(ifGT) */
+                       s1 = emit_load_s1_high(jd, iptr, REG_ITMP1);
+                       s2 = emit_load_s2_high(jd, iptr, REG_ITMP2);
+                       M_CMP(s1, s2);
+                       M_EOR(REG_ITMP3, REG_ITMP3, REG_ITMP3);
+                       M_MOVGT_IMM(2, REG_ITMP3);
+                       M_MOVEQ_IMM(1, REG_ITMP3);
+
+                       /* low compare: x=x+1(ifHI) */
+                       s1 = emit_load_s1_low(jd, iptr, REG_ITMP1);
+                       s2 = emit_load_s2_low(jd, iptr, REG_ITMP2);
+                       M_CMP(s1, s2);
+                       M_ADDHI_IMM(REG_ITMP3, REG_ITMP3, 1);
+
+                       /* branch if (x LE 1) */
+                       M_CMP_IMM(REG_ITMP3, 1);
+                       emit_ble(cd, iptr->dst.block);
+                       break;
+
+               case ICMD_IF_LCMPGT:    /* ..., value, value ==> ...                  */
+                                       /* op1 = target JavaVM pc                     */
+
+                       /* high compare: x=0(ifLT) ; x=1(ifEQ) ; x=2(ifGT) */
+                       s1 = emit_load_s1_high(jd, iptr, REG_ITMP1);
+                       s2 = emit_load_s2_high(jd, iptr, REG_ITMP2);
+                       M_CMP(s1, s2);
+                       M_EOR(REG_ITMP3, REG_ITMP3, REG_ITMP3);
+                       M_MOVGT_IMM(2, REG_ITMP3);
+                       M_MOVEQ_IMM(1, REG_ITMP3);
+
+                       /* low compare: x=x+1(ifHI) */
+                       s1 = emit_load_s1_low(jd, iptr, REG_ITMP1);
+                       s2 = emit_load_s2_low(jd, iptr, REG_ITMP2);
+                       M_CMP(s1, s2);
+                       M_ADDHI_IMM(REG_ITMP3, REG_ITMP3, 1);
+
+                       /* branch if (x GT 1) */
+                       M_CMP_IMM(REG_ITMP3, 1);
+                       emit_bgt(cd, iptr->dst.block);
+                       break;
+
+               case ICMD_IF_LCMPGE:    /* ..., value, value ==> ...                  */
+                                       /* op1 = target JavaVM pc                     */
+
+                       /* high compare: x=0(ifLT) ; x=1(ifEQ) ; x=2(ifGT) */
+                       s1 = emit_load_s1_high(jd, iptr, REG_ITMP1);
+                       s2 = emit_load_s2_high(jd, iptr, REG_ITMP2);
+                       M_CMP(s1, s2);
+                       M_EOR(REG_ITMP3, REG_ITMP3, REG_ITMP3);
+                       M_MOVGT_IMM(2, REG_ITMP3);
+                       M_MOVEQ_IMM(1, REG_ITMP3);
+
+                       /* low compare: x=x-1(ifLO) */
+                       s1 = emit_load_s1_low(jd, iptr, REG_ITMP1);
+                       s2 = emit_load_s2_low(jd, iptr, REG_ITMP2);
+                       M_CMP(s1, s2);
+                       M_SUBLO_IMM(REG_ITMP3, REG_ITMP3, 1);
+
+                       /* branch if (x GE 1) */
+                       M_CMP_IMM(REG_ITMP3, 1);
+                       emit_bge(cd, iptr->dst.block);
                        break;
 
                case ICMD_TABLESWITCH:  /* ..., index ==> ...                         */
@@ -1972,9 +1997,8 @@ bool codegen(jitdata *jd)
 
                        /* range check (index <= high-low) */
                        i = i - l + 1;
-                       M_COMPARE(REG_ITMP1, i-1, UNCOND, 0);
-                       M_BHI(0); /* unsigned greater than */
-                       codegen_addreference(cd, table[0].block);
+                       M_COMPARE(REG_ITMP1, i-1);
+                       emit_bugt(cd, table[0].block);
 
                        /* build jump table top down and use address of lowest entry */
 
@@ -2006,28 +2030,28 @@ bool codegen(jitdata *jd)
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
 
                        while (--i >= 0) {
-                               M_COMPARE(s1, lookup->value, UNCOND, 0);
-                               M_BEQ(0);
-                               codegen_addreference(cd, lookup->target.block);
+                               M_COMPARE(s1, lookup->value);
+                               emit_beq(cd, lookup->target.block);
                                lookup++;
                        }
 
                        /* default branch */
-                       M_B(0);
-                       codegen_addreference(cd, iptr->sx.s23.s3.lookupdefault.block);
+                       emit_br(cd, iptr->sx.s23.s3.lookupdefault.block);
                        }
                        break;
 
                case ICMD_FRETURN:      /* ..., retvalue ==> ...                      */
 
 #if !defined(ENABLE_SOFTFLOAT)
+                       REPLACEMENT_POINT_RETURN(cd, iptr);
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
-                       M_CAST_FLT_TO_INT_TYPED(VAROP(iptr->s1)->type, s1, REG_RESULT);
+                       M_CAST_F2I(s1, REG_RESULT);
                        goto ICMD_RETURN_do;
 #endif
 
                case ICMD_IRETURN:      /* ..., retvalue ==> ...                      */
 
+                       REPLACEMENT_POINT_RETURN(cd, iptr);
                        s1 = emit_load_s1(jd, iptr, REG_RESULT);
                        M_INTMOVE(s1, REG_RESULT);
                        goto ICMD_RETURN_do;
@@ -2035,31 +2059,33 @@ bool codegen(jitdata *jd)
                case ICMD_DRETURN:      /* ..., retvalue ==> ...                      */
 
 #if !defined(ENABLE_SOFTFLOAT)
+                       REPLACEMENT_POINT_RETURN(cd, iptr);
                        s1 = emit_load_s1(jd, iptr, REG_FTMP1);
-                       M_CAST_FLT_TO_INT_TYPED(VAROP(iptr->s1)->type, s1, REG_RESULT_PACKED);
+                       M_CAST_D2L(s1, REG_RESULT_PACKED);
                        goto ICMD_RETURN_do;
 #endif
 
                case ICMD_LRETURN:      /* ..., retvalue ==> ...                      */
 
+                       REPLACEMENT_POINT_RETURN(cd, iptr);
                        s1 = emit_load_s1(jd, iptr, REG_RESULT_PACKED);
                        M_LNGMOVE(s1, REG_RESULT_PACKED);
                        goto ICMD_RETURN_do;
 
                case ICMD_ARETURN:      /* ..., retvalue ==> ...                      */
 
+                       REPLACEMENT_POINT_RETURN(cd, iptr);
                        s1 = emit_load_s1(jd, iptr, REG_RESULT);
                        M_INTMOVE(s1, REG_RESULT);
                        if (INSTRUCTION_IS_UNRESOLVED(iptr)) {
-                               codegen_addpatchref(cd, PATCHER_athrow_areturn,
+                               patcher_add_patch_ref(jd, PATCHER_resolve_class,
                                                                        iptr->sx.s23.s2.uc, 0);
-
-                               if (opt_showdisassemble)
-                                       M_NOP;
                        }
                        goto ICMD_RETURN_do;
 
                case ICMD_RETURN:       /* ...  ==> ...                               */
+
+                       REPLACEMENT_POINT_RETURN(cd, iptr);
                        ICMD_RETURN_do:
 
 #if !defined(NDEBUG)
@@ -2070,10 +2096,10 @@ bool codegen(jitdata *jd)
 #if defined(ENABLE_THREADS)
                        /* call monitorexit function */
 
-                       if (checksync && (m->flags & ACC_SYNCHRONIZED)) {
+                       if (checksync && code_is_synchronized(code)) {
                                /* stack offset for monitor argument */
 
-                               s1 = rd->memuse;
+                               s1 = rd->memuse * 8;
 
                                /* we need to save the proper return value */
 
@@ -2084,11 +2110,11 @@ bool codegen(jitdata *jd)
                                case ICMD_FRETURN: /* XXX TWISTI: is that correct? */
                                case ICMD_DRETURN:
                                        M_STMFD(BITMASK_RESULT, REG_SP);
-                                       s1 += 2;
+                                       s1 += 2 * 4;
                                        break;
                                }
 
-                               M_LDR(REG_A0, REG_SP, s1 * 4);
+                               M_LDR(REG_A0, REG_SP, s1);
                                disp = dseg_add_functionptr(cd, LOCK_monitor_exit);
                                M_DSEG_BRANCH(disp);
 
@@ -2110,13 +2136,13 @@ bool codegen(jitdata *jd)
 
                        /* deallocate stackframe for spilled variables */
 
-                       if ((cd->stackframesize - savedregs_num) > 0)
-                               M_ADD_IMM_EXT_MUL4(REG_SP, REG_SP, cd->stackframesize - savedregs_num);
+                       if ((cd->stackframesize / 4 - savedregs_num) > 0)
+                               M_ADD_IMM_EXT_MUL4(REG_SP, REG_SP, cd->stackframesize / 4 - savedregs_num);
 
                        /* restore callee saved registers + do return */
 
                        if (savedregs_bitmask) {
-                               if (!jd->isleafmethod) {
+                               if (!code_is_leafmethod(code)) {
                                        savedregs_bitmask &= ~(1<<REG_LR);
                                        savedregs_bitmask |= (1<<REG_PC);
                                }
@@ -2125,7 +2151,7 @@ bool codegen(jitdata *jd)
 
                        /* if LR was not on stack, we need to return manually */
 
-                       if (jd->isleafmethod)
+                       if (code_is_leafmethod(code))
                                M_MOV(REG_PC, REG_LR);
                        break;
 
@@ -2140,6 +2166,8 @@ bool codegen(jitdata *jd)
                case ICMD_INVOKEVIRTUAL:/* op1 = arg count, val.a = method pointer    */
                case ICMD_INVOKEINTERFACE:
 
+                       REPLACEMENT_POINT_INVOKE(cd, iptr);
+
                        if (INSTRUCTION_IS_UNRESOLVED(iptr)) {
                                lm = NULL;
                                um = iptr->sx.s23.s3.um;
@@ -2160,6 +2188,7 @@ bool codegen(jitdata *jd)
 
                        for (s3 = s3 - 1; s3 >= 0; s3--) {
                                var = VAR(iptr->sx.s23.s2.args[s3]);
+                               d   = md->params[s3].regoff;
 
                                if (var->flags & PREALLOC) /* argument was precolored? */
                                        continue;
@@ -2169,43 +2198,39 @@ bool codegen(jitdata *jd)
                                if (IS_INT_LNG_TYPE(var->type)) {
 #endif /* !defined(ENABLE_SOFTFLOAT) */
                                        if (!md->params[s3].inmemory) {
-                                               s1 = ARGUMENT_REGS(var->type, md->params[s3].regoff);
-                                               SPLIT_OPEN(var->type, s1, REG_ITMP2);
-                                               d = emit_load(jd, iptr, var, s1);
+                                               s1 = emit_load(jd, iptr, var, d);
 
                                                if (IS_2_WORD_TYPE(var->type))
-                                                       M_LNGMOVE(d, s1);
+                                                       M_LNGMOVE(s1, d);
                                                else
-                                                       M_INTMOVE(d, s1);
-
-                                               SPLIT_STORE_AND_CLOSE(var->type, s1, 0);
+                                                       M_INTMOVE(s1, d);
                                        }
                                        else {
                                                if (IS_2_WORD_TYPE(var->type)) {
-                                                       d = emit_load(jd, iptr, var, REG_ITMP12_PACKED);
-                                                       M_LST(d, REG_SP, md->params[s3].regoff * 4);
+                                                       s1 = emit_load(jd, iptr, var, REG_ITMP12_PACKED);
+                                                       M_LST(s1, REG_SP, d);
                                                }
                                                else {
-                                                       d = emit_load(jd, iptr, var, REG_ITMP1);
-                                                       M_IST(d, REG_SP, md->params[s3].regoff * 4);
+                                                       s1 = emit_load(jd, iptr, var, REG_ITMP1);
+                                                       M_IST(s1, REG_SP, d);
                                                }
                                        }
 #if !defined(ENABLE_SOFTFLOAT)
                                }
                                else {
                                        if (!md->params[s3].inmemory) {
-                                               s1 = ARGUMENT_REGS(var->type, md->params[s3].regoff);
-                                               d = emit_load(jd, iptr, var, REG_FTMP1);
-                                               SPLIT_OPEN(var->type, s1, REG_ITMP1);
-                                               M_CAST_FLT_TO_INT_TYPED(var->type, d, s1);
-                                               SPLIT_STORE_AND_CLOSE(var->type, s1, 0);
+                                               s1 = emit_load(jd, iptr, var, REG_FTMP1);
+                                               if (IS_2_WORD_TYPE(var->type))
+                                                       M_CAST_D2L(s1, d);
+                                               else
+                                                       M_CAST_F2I(s1, d);
                                        }
                                        else {
-                                               d = emit_load(jd, iptr, var, REG_FTMP1);
+                                               s1 = emit_load(jd, iptr, var, REG_FTMP1);
                                                if (IS_2_WORD_TYPE(var->type))
-                                                       M_DST(d, REG_SP, md->params[s3].regoff * 4);
+                                                       M_DST(s1, REG_SP, d);
                                                else
-                                                       M_FST(d, REG_SP, md->params[s3].regoff * 4);
+                                                       M_FST(s1, REG_SP, d);
                                        }
                                }
 #endif /* !defined(ENABLE_SOFTFLOAT) */
@@ -2213,41 +2238,50 @@ bool codegen(jitdata *jd)
 
                        switch (iptr->opc) {
                        case ICMD_BUILTIN:
-                               disp = dseg_add_functionptr(cd, bte->fp);
 
-                               M_DSEG_LOAD(REG_PV, disp); /* Pointer to built-in-function */
+                               if (bte->stub == NULL) {
+                                       disp = dseg_add_functionptr(cd, bte->fp);
+                               } else {
+                                       disp = dseg_add_functionptr(cd, bte->stub);
+                               }
+
+                               M_DSEG_LOAD(REG_PV, disp); /* pointer to built-in-function */
+
+                               /* generate the actual call */
+
+                               M_MOV(REG_LR, REG_PC);
+                               M_MOV(REG_PC, REG_PV);
+                               s1 = (s4) (cd->mcodeptr - cd->mcodebase);
+                               M_RECOMPUTE_PV(s1);
                                break;
 
                        case ICMD_INVOKESPECIAL:
-                               M_TST(REG_A0, REG_A0);
-                               M_BEQ(0);
-                               codegen_add_nullpointerexception_ref(cd);
+                               emit_nullpointer_check(cd, iptr, REG_A0);
                                /* fall through */
 
                        case ICMD_INVOKESTATIC:
                                if (lm == NULL) {
                                        disp = dseg_add_unique_address(cd, NULL);
 
-                                       codegen_addpatchref(cd, PATCHER_invokestatic_special,
+                                       patcher_add_patch_ref(jd, PATCHER_invokestatic_special,
                                                                                um, disp);
-
-                                       if (opt_showdisassemble)
-                                               M_NOP;
                                }
                                else
                                        disp = dseg_add_address(cd, lm->stubroutine);
 
                                M_DSEG_LOAD(REG_PV, disp);            /* Pointer to method */
+
+                               /* generate the actual call */
+
+                               M_MOV(REG_LR, REG_PC);
+                               M_MOV(REG_PC, REG_PV);
+                               s1 = (s4) (cd->mcodeptr - cd->mcodebase);
+                               M_RECOMPUTE_PV(s1);
                                break;
 
                        case ICMD_INVOKEVIRTUAL:
-                               gen_nullptr_check(REG_A0);
-
                                if (lm == NULL) {
-                                       codegen_addpatchref(cd, PATCHER_invokevirtual, um, 0);
-
-                                       if (opt_showdisassemble)
-                                               M_NOP;
+                                       patcher_add_patch_ref(jd, PATCHER_invokevirtual, um, 0);
 
                                        s1 = 0;
                                }
@@ -2255,51 +2289,50 @@ bool codegen(jitdata *jd)
                                        s1 = OFFSET(vftbl_t, table[0]) +
                                                sizeof(methodptr) * lm->vftblindex;
 
+                               /* implicit null-pointer check */
                                M_LDR_INTERN(REG_METHODPTR, REG_A0,
-                                                        OFFSET(java_objectheader, vftbl));
+                                                        OFFSET(java_object_t, vftbl));
                                M_LDR_INTERN(REG_PV, REG_METHODPTR, s1);
+
+                               /* generate the actual call */
+
+                               M_MOV(REG_LR, REG_PC);
+                               M_MOV(REG_PC, REG_PV);
+                               s1 = (s4) (cd->mcodeptr - cd->mcodebase);
+                               M_RECOMPUTE_PV(s1);
                                break;
 
                        case ICMD_INVOKEINTERFACE:
-                               gen_nullptr_check(REG_A0);
-
                                if (lm == NULL) {
-                                       codegen_addpatchref(cd, PATCHER_invokeinterface, um, 0);
-
-                                       if (opt_showdisassemble)
-                                               M_NOP;
+                                       patcher_add_patch_ref(jd, PATCHER_invokeinterface, um, 0);
 
                                        s1 = 0;
                                        s2 = 0;
                                }
                                else {
                                        s1 = OFFSET(vftbl_t, interfacetable[0]) -
-                                               sizeof(methodptr*) * lm->class->index;
-                                       s2 = sizeof(methodptr) * (lm - lm->class->methods);
+                                               sizeof(methodptr*) * lm->clazz->index;
+                                       s2 = sizeof(methodptr) * (lm - lm->clazz->methods);
                                }
 
+                               /* implicit null-pointer check */
                                M_LDR_INTERN(REG_METHODPTR, REG_A0,
-                                                        OFFSET(java_objectheader, vftbl));
+                                                        OFFSET(java_object_t, vftbl));
                                M_LDR_INTERN(REG_METHODPTR, REG_METHODPTR, s1);
                                M_LDR_INTERN(REG_PV, REG_METHODPTR, s2);
-                               break;
-                       }
-
-                       /* generate the actual call */
 
-                       M_MOV(REG_LR, REG_PC);               /* save return address in LR */
-                       M_MOV(REG_PC, REG_PV);               /* branch to method          */
-                       s1 = (s4) (cd->mcodeptr - cd->mcodebase);
-                       M_RECOMPUTE_PV(s1);
+                               /* generate the actual call */
 
-                       /* actually only used for ICMD_BUILTIN */
-
-                       if (INSTRUCTION_MUST_CHECK(iptr)) {
-                               M_TST(REG_RESULT, REG_RESULT);
-                               M_BEQ(0);
-                               codegen_add_fillinstacktrace_ref(cd);
+                               M_MOV(REG_LR, REG_PC);
+                               M_MOV(REG_PC, REG_PV);
+                               s1 = (s4) (cd->mcodeptr - cd->mcodebase);
+                               M_RECOMPUTE_PV(s1);
+                               break;
                        }
 
+                       /* store size of call code in replacement point */
+                       REPLACEMENT_POINT_INVOKE_RETURN(cd, iptr);
+
                        /* store return value */
 
                        d = md->returntype.type;
@@ -2310,7 +2343,7 @@ bool codegen(jitdata *jd)
                           our ENABLE_SOFTFLOAT define */
                        if (iptr->opc == ICMD_BUILTIN && d != TYPE_VOID && IS_FLT_DBL_TYPE(d)) {
 #if 0 && !defined(NDEBUG)
-                               dolog("BUILTIN that returns float or double (%s.%s)", m->class->name->text, m->name->text);
+                               dolog("BUILTIN that returns float or double (%s.%s)", m->clazz->name->text, m->name->text);
 #endif
                                /* we cannot use this macro, since it is not defined
                                   in ENABLE_SOFTFLOAT M_CAST_FLT_TO_INT_TYPED(d,
@@ -2341,7 +2374,10 @@ bool codegen(jitdata *jd)
 #if !defined(ENABLE_SOFTFLOAT)
                                } else {
                                        s1 = codegen_reg_of_dst(jd, iptr, REG_FTMP1);
-                                       M_CAST_INT_TO_FLT_TYPED(VAROP(iptr->dst)->type, REG_RESULT_TYPED(VAROP(iptr->dst)->type), s1);
+                                       if (IS_2_WORD_TYPE(d))
+                                               M_CAST_L2D(REG_RESULT_PACKED, s1);
+                                       else
+                                               M_CAST_I2F(REG_RESULT, s1);
                                }
 #endif /* !defined(ENABLE_SOFTFLOAT) */
 
@@ -2350,16 +2386,12 @@ bool codegen(jitdata *jd)
                        break;
 
                case ICMD_CHECKCAST:  /* ..., objectref ==> ..., objectref            */
-                                     /* val.a: (classinfo*) superclass               */
 
                        if (!(iptr->flags.bits & INS_FLAG_ARRAY)) {
                                /* object type cast-check */
 
                        classinfo *super;
                        s4         superindex;
-                       u1        *branch1 = NULL;
-                       u1        *branch2 = NULL;
-                       u1        *branch3 = NULL;
 
                        if (INSTRUCTION_IS_UNRESOLVED(iptr)) {
                                super      = NULL;
@@ -2370,123 +2402,125 @@ bool codegen(jitdata *jd)
                                superindex = super->index;
                        }
 
-#if defined(ENABLE_THREADS)
-                       codegen_threadcritrestart(cd, cd->mcodeptr - cd->mcodebase);
-#endif
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
 
                        /* if class is not resolved, check which code to call */
 
                        if (super == NULL) {
                                M_TST(s1, s1);
-                               M_BEQ(0);
-                               branch1 = cd->mcodeptr;
+                               emit_label_beq(cd, BRANCH_LABEL_1);
 
                                disp = dseg_add_unique_s4(cd, 0); /* super->flags */
-                               codegen_addpatchref(cd, PATCHER_checkcast_instanceof_flags,
+                               patcher_add_patch_ref(jd, PATCHER_resolve_classref_to_flags,
                                                    iptr->sx.s23.s3.c.ref, disp);
 
-                               if (opt_showdisassemble)
-                                       M_NOP;
-
                                M_DSEG_LOAD(REG_ITMP2, disp);
                                disp = dseg_add_s4(cd, ACC_INTERFACE);
                                M_DSEG_LOAD(REG_ITMP3, disp);
                                M_TST(REG_ITMP2, REG_ITMP3);
-                               M_BEQ(0);
-                               branch2 = cd->mcodeptr;
+                               emit_label_beq(cd, BRANCH_LABEL_2);
                        }
 
                        /* interface checkcast code */
 
                        if ((super == NULL) || (super->flags & ACC_INTERFACE)) {
+                               if ((super == NULL) || !IS_IMM(superindex)) {
+                                       disp = dseg_add_unique_s4(cd, superindex);
+                               }
                                if (super == NULL) {
-                                       codegen_addpatchref(cd,
-                                                           PATCHER_checkcast_instanceof_interface,
-                                                           iptr->sx.s23.s3.c.ref, 0);
-
-                                       if (opt_showdisassemble)
-                                               M_NOP;
+                                       patcher_add_patch_ref(jd, PATCHER_resolve_classref_to_index,
+                                                           iptr->sx.s23.s3.c.ref, disp);
                                }
                                else {
                                        M_TST(s1, s1);
-                                       M_BEQ(0);
-                                       branch1 = cd->mcodeptr;
+                                       emit_label_beq(cd, BRANCH_LABEL_3);
                                }
 
-                               M_LDR_INTERN(REG_ITMP2, s1, OFFSET(java_objectheader, vftbl));
+                               M_LDR_INTERN(REG_ITMP2, s1, OFFSET(java_object_t, vftbl));
                                M_LDR_INTERN(REG_ITMP3, REG_ITMP2, OFFSET(vftbl_t, interfacetablelength));
-                               assert(IS_IMM(superindex));
-                               M_CMP_IMM(REG_ITMP3, superindex);
-                               M_BLE(0);
-                               codegen_add_classcastexception_ref(cd, s1);
 
-                               s2 = OFFSET(vftbl_t, interfacetable[0]) -
-                                       superindex * sizeof(methodptr*);
+                               /* we put unresolved or non-immediate superindices onto dseg */
+                               if ((super == NULL) || !IS_IMM(superindex)) {
+                                       /* disp was computed before we added the patcher */
+                                       M_DSEG_LOAD(REG_ITMP2, disp);
+                                       M_CMP(REG_ITMP3, REG_ITMP2);
+                               } else {
+                                       assert(IS_IMM(superindex));
+                                       M_CMP_IMM(REG_ITMP3, superindex);
+                               }
 
-                               M_LDR_INTERN(REG_ITMP3, REG_ITMP2, s2);
-                               M_TST(REG_ITMP3, REG_ITMP3);
-                               M_BEQ(0);
-                               codegen_add_classcastexception_ref(cd, s1);
+                               emit_classcast_check(cd, iptr, BRANCH_LE, REG_ITMP3, s1);
+
+                               /* if we loaded the superindex out of the dseg above, we do
+                                  things differently here! */
+                               if ((super == NULL) || !IS_IMM(superindex)) {
+
+                                       M_LDR_INTERN(REG_ITMP3, s1, OFFSET(java_object_t, vftbl));
+
+                                       /* the address math below needs interfacetable[0] at offset 0 */
+                                       assert(OFFSET(vftbl_t, interfacetable[0]) == 0);
+
+                                       /* this does: REG_ITMP3 - superindex * sizeof(methodptr*) */
+                                       assert(sizeof(methodptr*) == 4);
+                                       M_SUB(REG_ITMP2, REG_ITMP3, REG_LSL(REG_ITMP2, 2));
+
+                                       s2 = 0;
+
+                               } else {
+
+                                       s2 = OFFSET(vftbl_t, interfacetable[0]) -
+                                                               superindex * sizeof(methodptr*);
 
-                               if (super == NULL) {
-                                       M_B(0);
-                                       branch3 = cd->mcodeptr;
                                }
-                       }
 
-                       if (branch2) {
-                               gen_resolvebranch(branch2, branch2 - cd->mcodebase,
-                                                                 cd->mcodeptr - cd->mcodebase);
+                               M_LDR_INTERN(REG_ITMP3, REG_ITMP2, s2);
+                               M_TST(REG_ITMP3, REG_ITMP3);
+                               emit_classcast_check(cd, iptr, BRANCH_EQ, REG_ITMP3, s1);
+
+                               if (super == NULL)
+                                       emit_label_br(cd, BRANCH_LABEL_4);
+                               else
+                                       emit_label(cd, BRANCH_LABEL_3);
                        }
 
                        /* class checkcast code */
 
                        if ((super == NULL) || !(super->flags & ACC_INTERFACE)) {
                                if (super == NULL) {
+                                       emit_label(cd, BRANCH_LABEL_2);
+
                                        disp = dseg_add_unique_address(cd, NULL);
 
-                                       codegen_addpatchref(cd, PATCHER_checkcast_instanceof_class,
+                                       patcher_add_patch_ref(jd, PATCHER_resolve_classref_to_vftbl,
                                                            iptr->sx.s23.s3.c.ref,
                                                                                disp);
-
-                                       if (opt_showdisassemble)
-                                               M_NOP;
                                }
                                else {
                                        disp = dseg_add_address(cd, super->vftbl);
 
                                        M_TST(s1, s1);
-                                       M_BEQ(0);
-                                       branch1 = cd->mcodeptr;
+                                       emit_label_beq(cd, BRANCH_LABEL_5);
                                }
 
-                               M_LDR_INTERN(REG_ITMP2, s1, OFFSET(java_objectheader, vftbl));
+                               M_LDR_INTERN(REG_ITMP2, s1, OFFSET(java_object_t, vftbl));
                                M_DSEG_LOAD(REG_ITMP3, disp);
-#if defined(ENABLE_THREADS)
-                               codegen_threadcritstart(cd, cd->mcodeptr - cd->mcodebase);
-#endif
+
                                M_LDR_INTERN(REG_ITMP2, REG_ITMP2, OFFSET(vftbl_t, baseval));
                                M_LDR_INTERN(REG_ITMP3, REG_ITMP3, OFFSET(vftbl_t, baseval));
                                M_SUB(REG_ITMP2, REG_ITMP2, REG_ITMP3);
                                M_DSEG_LOAD(REG_ITMP3, disp);
                                M_LDR_INTERN(REG_ITMP3, REG_ITMP3, OFFSET(vftbl_t, diffval));
-#if defined(ENABLE_THREADS)
-                               codegen_threadcritstop(cd, cd->mcodeptr - cd->mcodebase);
-#endif
+
                                M_CMP(REG_ITMP2, REG_ITMP3);
-                               M_BHI(0);
-                               codegen_add_classcastexception_ref(cd, s1);
-                       }
+                               emit_classcast_check(cd, iptr, BRANCH_UGT, 0, s1);
 
-                       if (branch1) {
-                               gen_resolvebranch(branch1, branch1 - cd->mcodebase,
-                                                                 cd->mcodeptr - cd->mcodebase);
+                               if (super != NULL)
+                                       emit_label(cd, BRANCH_LABEL_5);
                        }
 
-                       if (branch3) {
-                               gen_resolvebranch(branch3, branch3 - cd->mcodebase,
-                                                                 cd->mcodeptr - cd->mcodebase);
+                       if (super == NULL) {
+                               emit_label(cd, BRANCH_LABEL_1);
+                               emit_label(cd, BRANCH_LABEL_4);
                        }
 
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP1);
@@ -2500,12 +2534,9 @@ bool codegen(jitdata *jd)
                                if (INSTRUCTION_IS_UNRESOLVED(iptr)) {
                                        disp = dseg_add_unique_address(cd, NULL);
 
-                                       codegen_addpatchref(cd, PATCHER_builtin_arraycheckcast,
+                                       patcher_add_patch_ref(jd, PATCHER_resolve_classref_to_classinfo,
                                                                                iptr->sx.s23.s3.c.ref,
                                                                                disp);
-
-                                       if (opt_showdisassemble)
-                                               M_NOP;
                                }
                                else
                                        disp = dseg_add_address(cd, iptr->sx.s23.s3.c.cls);
@@ -2520,8 +2551,7 @@ bool codegen(jitdata *jd)
 
                                s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                                M_TST(REG_RESULT, REG_RESULT);
-                               M_BEQ(0);
-                               codegen_add_classcastexception_ref(cd, s1);
+                               emit_classcast_check(cd, iptr, BRANCH_EQ, REG_RESULT, s1);
 
                                d = codegen_reg_of_dst(jd, iptr, s1);
                        }
@@ -2531,13 +2561,10 @@ bool codegen(jitdata *jd)
                        break;
 
                case ICMD_INSTANCEOF: /* ..., objectref ==> ..., intresult            */
-                                     /* val.a: (classinfo*) superclass               */
+
                        {
                        classinfo *super;
                        s4         superindex;
-                       u1        *branch1 = NULL;
-                       u1        *branch2 = NULL;
-                       u1        *branch3 = NULL;
 
                        if (INSTRUCTION_IS_UNRESOLVED(iptr)) {
                                super      = NULL;
@@ -2548,11 +2575,9 @@ bool codegen(jitdata *jd)
                                superindex = super->index;
                        }
 
-#if defined(ENABLE_THREADS)
-                       codegen_threadcritrestart(cd, cd->mcodeptr - cd->mcodebase);
-#endif
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
                        d = codegen_reg_of_dst(jd, iptr, REG_ITMP2);
+
                        if (s1 == d) {
                                M_MOV(REG_ITMP1, s1);
                                s1 = REG_ITMP1;
@@ -2562,122 +2587,134 @@ bool codegen(jitdata *jd)
 
                        if (super == NULL) {
                                M_EOR(d, d, d);
+
                                M_TST(s1, s1);
-                               M_BEQ(0);
-                               branch1 = cd->mcodeptr;
+                               emit_label_beq(cd, BRANCH_LABEL_1);
 
                                disp = dseg_add_unique_s4(cd, 0); /* super->flags */
-                               codegen_addpatchref(cd, PATCHER_checkcast_instanceof_flags,
+                               patcher_add_patch_ref(jd, PATCHER_resolve_classref_to_flags,
                                                    iptr->sx.s23.s3.c.ref, disp);
 
-                               if (opt_showdisassemble)
-                                       M_NOP;
-
                                M_DSEG_LOAD(REG_ITMP2, disp);
                                disp = dseg_add_s4(cd, ACC_INTERFACE);
                                M_DSEG_LOAD(REG_ITMP3, disp);
                                M_TST(REG_ITMP2, REG_ITMP3);
-                               M_BEQ(0);
-                               branch2 = cd->mcodeptr;
+                               emit_label_beq(cd, BRANCH_LABEL_2);
                        }
 
                        /* interface checkcast code */
 
                        if ((super == NULL) || (super->flags & ACC_INTERFACE)) {
+                               if ((super == NULL) || !IS_IMM(superindex)) {
+                                       disp = dseg_add_unique_s4(cd, superindex);
+                               }
                                if (super == NULL) {
                                        /* If d == REG_ITMP2, then it's destroyed in check
                                           code above.  */
                                        if (d == REG_ITMP2)
                                                M_EOR(d, d, d);
 
-                                       codegen_addpatchref(cd,
-                                                           PATCHER_checkcast_instanceof_interface,
-                                                           iptr->sx.s23.s3.c.ref, 0);
-
-                                       if (opt_showdisassemble)
-                                               M_NOP;
+                                       patcher_add_patch_ref(jd, PATCHER_resolve_classref_to_index,
+                                                           iptr->sx.s23.s3.c.ref, disp);
                                }
                                else {
                                        M_EOR(d, d, d);
                                        M_TST(s1, s1);
-                                       M_BEQ(0);
-                                       branch1 = cd->mcodeptr;
+                                       emit_label_beq(cd, BRANCH_LABEL_3);
                                }
 
-                               M_LDR_INTERN(REG_ITMP1, s1, OFFSET(java_objectheader, vftbl));
+                               M_LDR_INTERN(REG_ITMP1, s1, OFFSET(java_object_t, vftbl));
                                M_LDR_INTERN(REG_ITMP3,
                                                         REG_ITMP1, OFFSET(vftbl_t, interfacetablelength));
-                               assert(IS_IMM(superindex));
-                               M_CMP_IMM(REG_ITMP3, superindex);
-                               M_BLE(2);
 
-                               s2 = OFFSET(vftbl_t, interfacetable[0]) -
-                                       superindex * sizeof(methodptr*);
+                               /* we put unresolved or non-immediate superindices onto dseg
+                                  and do things slightly differently */
+                               if ((super == NULL) || !IS_IMM(superindex)) {
+                                       /* disp was computed before we added the patcher */
+                                       M_DSEG_LOAD(REG_ITMP2, disp);
+                                       M_CMP(REG_ITMP3, REG_ITMP2);
+
+                                       if (d == REG_ITMP2) {
+                                               M_EORLE(d, d, d);
+                                               M_BLE(4);
+                                       } else {
+                                               M_BLE(3);
+                                       }
 
-                               M_LDR_INTERN(REG_ITMP3, REG_ITMP1, s2);
-                               M_TST(REG_ITMP3, REG_ITMP3);
-                               M_MOVNE_IMM(d, 1);
+                                       /* assumes interfacetable[0] is at offset 0 in vftbl_t */
+                                       assert(OFFSET(vftbl_t, interfacetable[0]) == 0);
+
+                                       /* this does: REG_ITMP1 - superindex * sizeof(methodptr*) */
+                                       assert(sizeof(methodptr*) == 4);
+                                       M_SUB(REG_ITMP1, REG_ITMP1, REG_LSL(REG_ITMP2, 2));
+
+                                       if (d == REG_ITMP2) {
+                                               M_EOR(d, d, d);
+                                       }
+
+                                       s2 = 0;
+
+                               } else {
+                                       assert(IS_IMM(superindex));
+                                       M_CMP_IMM(REG_ITMP3, superindex);
+
+                                       M_BLE(2);
+
+                                       s2 = OFFSET(vftbl_t, interfacetable[0]) -
+                                               superindex * sizeof(methodptr*);
 
-                               if (super == NULL) {
-                                       M_B(0);
-                                       branch3 = cd->mcodeptr;
                                }
-                       }
 
-                       if (branch2) {
-                               gen_resolvebranch(branch2, branch2 - cd->mcodebase,
-                                                                 cd->mcodeptr - cd->mcodebase);
+                               M_LDR_INTERN(REG_ITMP3, REG_ITMP1, s2);
+                               M_TST(REG_ITMP3, REG_ITMP3);
+                               M_MOVNE_IMM(1, d);
+
+                               if (super == NULL)
+                                       emit_label_br(cd, BRANCH_LABEL_4);
+                               else
+                                       emit_label(cd, BRANCH_LABEL_3);
                        }
 
                        /* class checkcast code */
 
                        if ((super == NULL) || !(super->flags & ACC_INTERFACE)) {
                                if (super == NULL) {
-                                       disp = dseg_add_unique_address(cd, NULL);
+                                       emit_label(cd, BRANCH_LABEL_2);
 
-                                       codegen_addpatchref(cd, PATCHER_checkcast_instanceof_class,
-                                                           iptr->sx.s23.s3.c.ref,
-                                                                               disp);
+                                       disp = dseg_add_unique_address(cd, NULL);
 
-                                       if (opt_showdisassemble)
-                                               M_NOP;
+                                       patcher_add_patch_ref(jd, PATCHER_resolve_classref_to_vftbl,
+                                                           iptr->sx.s23.s3.c.ref, disp);
                                }
                                else {
                                        disp = dseg_add_address(cd, super->vftbl);
 
                                        M_EOR(d, d, d);
                                        M_TST(s1, s1);
-                                       M_BEQ(0);
-                                       branch1 = cd->mcodeptr;
+                                       emit_label_beq(cd, BRANCH_LABEL_5);
                                }
 
-                               M_LDR_INTERN(REG_ITMP1, s1, OFFSET(java_objectheader, vftbl));
+                               M_LDR_INTERN(REG_ITMP1, s1, OFFSET(java_object_t, vftbl));
                                M_DSEG_LOAD(REG_ITMP2, disp);
-#if defined(ENABLE_THREADS)
-                               codegen_threadcritstart(cd, cd->mcodeptr - cd->mcodebase);
-#endif
+
                                M_LDR_INTERN(REG_ITMP1, REG_ITMP1, OFFSET(vftbl_t, baseval));
                                M_LDR_INTERN(REG_ITMP3, REG_ITMP2, OFFSET(vftbl_t, baseval));
                                M_LDR_INTERN(REG_ITMP2, REG_ITMP2, OFFSET(vftbl_t, diffval));
-#if defined(ENABLE_THREADS)
-                               codegen_threadcritstop(cd, cd->mcodeptr - cd->mcodebase);
-#endif
+
                                M_SUB(REG_ITMP1, REG_ITMP1, REG_ITMP3);
                                M_CMP(REG_ITMP1, REG_ITMP2);
                                /* If d == REG_ITMP2, then it's destroyed */
                                if (d == REG_ITMP2)
                                        M_EOR(d, d, d);
-                               M_MOVLS_IMM(d, 1);
-                       }
+                               M_MOVLS_IMM(1, d);
 
-                       if (branch1) {
-                               gen_resolvebranch(branch1, branch1 - cd->mcodebase,
-                                                                 cd->mcodeptr - cd->mcodebase);
+                               if (super != NULL)
+                                       emit_label(cd, BRANCH_LABEL_5);
                        }
 
-                       if (branch3) {
-                               gen_resolvebranch(branch3, branch3 - cd->mcodebase,
-                                                                 cd->mcodeptr - cd->mcodebase);
+                       if (super == NULL) {
+                               emit_label(cd, BRANCH_LABEL_1);
+                               emit_label(cd, BRANCH_LABEL_4);
                        }
 
                        }
@@ -2713,11 +2750,8 @@ bool codegen(jitdata *jd)
                        if (INSTRUCTION_IS_UNRESOLVED(iptr)) {
                                disp = dseg_add_unique_address(cd, NULL);
 
-                               codegen_addpatchref(cd, PATCHER_builtin_multianewarray,
+                               patcher_add_patch_ref(jd, PATCHER_resolve_classref_to_classinfo,
                                                                        iptr->sx.s23.s3.c.ref, disp);
-
-                               if (opt_showdisassemble)
-                                       M_NOP;
                        }
                        else
                                disp = dseg_add_address(cd, iptr->sx.s23.s3.c.cls);
@@ -2742,9 +2776,7 @@ bool codegen(jitdata *jd)
 
                        /* check for exception before result assignment */
 
-                       M_TST(REG_RESULT, REG_RESULT);
-                       M_BEQ(0);
-                       codegen_add_fillinstacktrace_ref(cd);
+                       emit_exception_check(cd, iptr);
 
                        /* get arrayref */
 
@@ -2756,9 +2788,7 @@ bool codegen(jitdata *jd)
                case ICMD_CHECKNULL:  /* ..., objectref  ==> ..., objectref           */
 
                        s1 = emit_load_s1(jd, iptr, REG_ITMP1);
-                       M_TST(s1, s1);
-                       M_BEQ(0);
-                       codegen_add_nullpointerexception_ref(cd);
+                       emit_nullpointer_check(cd, iptr, s1);
                        break;
 
                default:
@@ -2771,15 +2801,9 @@ bool codegen(jitdata *jd)
 
        } /* for all basic blocks */
 
-       dseg_createlinenumbertable(cd);
-
+       /* generate traps */
 
-       /* generate exception and patcher stubs */
-
-       emit_exception_stubs(jd);
-       emit_patcher_stubs(jd);
-
-       codegen_finish(jd);
+       emit_patcher_traps(jd);
 
        /* everything's ok */
 
@@ -2787,142 +2811,95 @@ bool codegen(jitdata *jd)
 }
 
 
-/* createcompilerstub **********************************************************
-
-   creates a stub routine which calls the compiler
+/* codegen_emit_stub_compiler **************************************************
 
+   Emits a stub routine which calls the compiler.
+       
 *******************************************************************************/
 
-#define COMPILERSTUB_DATASIZE    3 * SIZEOF_VOID_P
-#define COMPILERSTUB_CODESIZE    2 * 4
-
-#define COMPILERSTUB_SIZE        COMPILERSTUB_DATASIZE + COMPILERSTUB_CODESIZE
-
-
-u1 *createcompilerstub(methodinfo *m)
+void codegen_emit_stub_compiler(jitdata *jd)
 {
-       u1          *s;                     /* memory to hold the stub            */
-       ptrint      *d;
+       methodinfo  *m;
        codegendata *cd;
-       s4           dumpsize;              /* code generation pointer            */
-
-       s = CNEW(u1, COMPILERSTUB_SIZE);
-
-       /* set data pointer and code pointer */
-
-       d = (ptrint *) s;
-       s = s + COMPILERSTUB_DATASIZE;
-
-       /* mark start of dump memory area */
-
-       dumpsize = dump_size();
 
-       cd = DNEW(codegendata);
-       cd->mcodeptr = s;
+       /* get required compiler data */
 
-       /* The codeinfo pointer is actually a pointer to the
-          methodinfo. This fakes a codeinfo structure. */
-       
-       d[0] = (ptrint) asm_call_jit_compiler;
-       d[1] = (ptrint) m;
-       d[2] = (ptrint) &d[1];                                    /* fake code->m */
+       m  = jd->m;
+       cd = jd->cd;
 
        /* code for the stub */
 
        M_LDR_INTERN(REG_ITMP1, REG_PC, -(2 * 4 + 2 * SIZEOF_VOID_P));
        M_LDR_INTERN(REG_PC, REG_PC, -(3 * 4 + 3 * SIZEOF_VOID_P));
-
-#if defined(ENABLE_STATISTICS)
-       if (opt_stat)
-               count_cstub_len += COMPILERSTUB_SIZE * 4;
-#endif
-
-       /* release dump area */
-
-       dump_release(dumpsize);
-
-       /* synchronize instruction and data cache */
-
-       md_cacheflush(s, cd->mcodeptr - (u1 *) d);
-
-       return s;
 }
 
 
-/* createnativestub ************************************************************
+/* codegen_emit_stub_native ****************************************************
 
-   Creates a stub routine which calls a native method.
+   Emits a stub routine which calls a native method.
 
 *******************************************************************************/
 
-u1 *createnativestub(functionptr f, jitdata *jd, methoddesc *nmd)
+void codegen_emit_stub_native(jitdata *jd, methoddesc *nmd, functionptr f, int skipparams)
 {
-       methodinfo   *m;
-       codeinfo     *code;
-       codegendata  *cd;
-       registerdata *rd;
-       s4            nativeparams;
-       methoddesc   *md;
-       s4            i, j;
-       s4            t;
-       s4            disp, funcdisp, s1, s2;
+       methodinfo  *m;
+       codeinfo    *code;
+       codegendata *cd;
+       methoddesc  *md;
+       s4           i, j;
+       s4           t;
+       int          s1, s2;
+       int          disp;
 
        /* get required compiler data */
 
        m    = jd->m;
        code = jd->code;
        cd   = jd->cd;
-       rd   = jd->rd;
 
        /* initialize variables */
 
        md = m->parseddesc;
-       nativeparams = (m->flags & ACC_STATIC) ? 2 : 1;
 
        /* calculate stackframe size */
 
-       cd->stackframesize = 
-               1 +                                                /* return address  */
-               sizeof(stackframeinfo) / SIZEOF_VOID_P +           /* stackframeinfo  */
-               sizeof(localref_table) / SIZEOF_VOID_P +           /* localref_table  */
-               nmd->memuse;                                       /* stack arguments */
+       cd->stackframesize =
+               4 +                                                /* return address  */
+               sizeof(stackframeinfo_t) +                         /* stackframeinfo  */
+               sizeof(localref_table) +                           /* localref_table  */
+               nmd->memuse * 4;                                   /* stack arguments */
 
        /* align stack to 8-byte */
 
-       cd->stackframesize = (cd->stackframesize + 1) & ~1;
+       cd->stackframesize = (cd->stackframesize + 4) & ~4;
 
        /* create method header */
 
        (void) dseg_add_unique_address(cd, code);              /* CodeinfoPointer */
-       (void) dseg_add_unique_s4(cd, cd->stackframesize * 4); /* FrameSize       */
-       (void) dseg_add_unique_s4(cd, 0);                      /* IsSync          */
+       (void) dseg_add_unique_s4(cd, cd->stackframesize);     /* FrameSize       */
        (void) dseg_add_unique_s4(cd, 0);                      /* IsLeaf          */
        (void) dseg_add_unique_s4(cd, 0);                      /* IntSave         */
        (void) dseg_add_unique_s4(cd, 0);                      /* FltSave         */
-       (void) dseg_addlinenumbertablesize(cd);
-       (void) dseg_add_unique_s4(cd, 0);                      /* ExTableSize     */
 
        /* generate stub code */
 
        M_STMFD(1<<REG_LR, REG_SP);
-       M_SUB_IMM_EXT_MUL4(REG_SP, REG_SP, cd->stackframesize - 1);
+       M_SUB_IMM_EXT_MUL4(REG_SP, REG_SP, cd->stackframesize / 4 - 1);
 
 #if !defined(NDEBUG)
        if (JITDATA_HAS_FLAG_VERBOSECALL(jd))
                emit_verbosecall_enter(jd);
 #endif
 
-       /* get function address (this must happen before the stackframeinfo) */
+#if defined(ENABLE_GC_CACAO)
+       /* Save callee saved integer registers in stackframeinfo (GC may
+          need to recover them during a collection). */
 
-       funcdisp = dseg_add_functionptr(cd, f);
+       disp = cd->stackframesize - SIZEOF_VOID_P - sizeof(stackframeinfo_t) +
+               OFFSET(stackframeinfo_t, intregs);
 
-#if !defined(WITH_STATIC_CLASSPATH)
-       if (f == NULL) {
-               codegen_addpatchref(cd, PATCHER_resolve_native, m, funcdisp);
-
-               if (opt_showdisassemble)
-                       M_NOP;
-       }
+       for (i = 0; i < INT_SAV_CNT; i++)
+               M_STR_INTERN(abi_registers_integer_saved[i], REG_SP, disp + i * 4);
 #endif
 
        /* Save integer and float argument registers (these are 4
@@ -2933,11 +2910,8 @@ u1 *createnativestub(functionptr f, jitdata *jd, methoddesc *nmd)
 
        /* create native stackframe info */
 
-       assert(IS_IMM(4*4 + cd->stackframesize * 4));
-       M_ADD_IMM(REG_A0, REG_SP, 4*4 + cd->stackframesize * 4 - SIZEOF_VOID_P);
+       M_ADD_IMM(REG_A0, REG_SP, 4*4);
        M_MOV(REG_A1, REG_PV);
-       M_ADD_IMM(REG_A2, REG_SP, 4*4 + cd->stackframesize * 4);
-       M_LDR_INTERN(REG_A3, REG_SP, 4*4 + cd->stackframesize * 4 - SIZEOF_VOID_P);
        disp = dseg_add_functionptr(cd, codegen_start_native_call);
        M_DSEG_BRANCH(disp);
 
@@ -2946,6 +2920,11 @@ u1 *createnativestub(functionptr f, jitdata *jd, methoddesc *nmd)
        s1 = (s4) (cd->mcodeptr - cd->mcodebase);
        M_RECOMPUTE_PV(s1);
 
+       /* remember class argument */
+
+       if (m->flags & ACC_STATIC)
+               M_MOV(REG_ITMP3, REG_RESULT);
+
        /* Restore integer and float argument registers (these are 4
           registers, stack is 8-byte aligned). */
 
@@ -2955,18 +2934,15 @@ u1 *createnativestub(functionptr f, jitdata *jd, methoddesc *nmd)
        /* copy or spill arguments to new locations */
        /* ATTENTION: the ARM has only integer argument registers! */
 
-       for (i = md->paramcount - 1, j = i + nativeparams; i >= 0; i--, j--) {
+       for (i = md->paramcount - 1, j = i + skipparams; i >= 0; i--, j--) {
                t = md->paramtypes[i].type;
 
                if (!md->params[i].inmemory) {
-                       s1 = ARGUMENT_REGS(t, md->params[i].regoff);
+                       s1 = md->params[i].regoff;
+                       s2 = nmd->params[j].regoff;
 
                        if (!nmd->params[j].inmemory) {
-                               s2 = ARGUMENT_REGS(t, nmd->params[j].regoff);
-
 #if !defined(__ARM_EABI__)
-                               SPLIT_OPEN(t, s1, REG_ITMP1);
-                               SPLIT_LOAD(t, s1, cd->stackframesize);
                                SPLIT_OPEN(t, s2, REG_ITMP1);
 #endif
 
@@ -2980,18 +2956,10 @@ u1 *createnativestub(functionptr f, jitdata *jd, methoddesc *nmd)
 #endif
                        }
                        else {
-                               s2 = nmd->params[j].regoff;
-
-#if !defined(__ARM_EABI__)
-                               SPLIT_OPEN(t, s1, REG_ITMP1);
-                               SPLIT_LOAD(t, s1, cd->stackframesize);
-#endif
-
                                if (IS_2_WORD_TYPE(t))
-                                       M_LST(s1, REG_SP, s2 * 4);
+                                       M_LST(s1, REG_SP, s2);
                                else
-                                       M_IST(s1, REG_SP, s2 * 4);
-                               /* no SPLIT_CLOSE here because argument is fully on stack now */
+                                       M_IST(s1, REG_SP, s2);
                        }
                }
                else {
@@ -2999,31 +2967,34 @@ u1 *createnativestub(functionptr f, jitdata *jd, methoddesc *nmd)
                        s2 = nmd->params[j].regoff;
 
                        if (IS_2_WORD_TYPE(t)) {
-                               M_LLD(REG_ITMP12_PACKED, REG_SP, s1 * 4);
-                               M_LST(REG_ITMP12_PACKED, REG_SP, s2 * 4);
+                               M_LLD(REG_ITMP12_PACKED, REG_SP, s1);
+                               M_LST(REG_ITMP12_PACKED, REG_SP, s2);
                        }
                        else {
-                               M_ILD(REG_ITMP1, REG_SP, s1 * 4);
-                               M_IST(REG_ITMP1, REG_SP, s2 * 4);
+                               M_ILD(REG_ITMP1, REG_SP, s1);
+                               M_IST(REG_ITMP1, REG_SP, s2);
                        }
                }
        }
 
-       /* put class into second argument register */
+       /* Handle native Java methods. */
 
-       if (m->flags & ACC_STATIC) {
-               disp = dseg_add_address(cd, m->class);
-               M_DSEG_LOAD(REG_A1, disp);
-       }
+       if (m->flags & ACC_NATIVE) {
+               /* put class into second argument register */
 
-       /* put env into first argument register */
+               if (m->flags & ACC_STATIC)
+                       M_MOV(REG_A1, REG_ITMP3);
 
-       disp = dseg_add_address(cd, _Jv_env);
-       M_DSEG_LOAD(REG_A0, disp);
+               /* put env into first argument register */
 
-       /* do the native function call */
+               disp = dseg_add_address(cd, _Jv_env);
+               M_DSEG_LOAD(REG_A0, disp);
+       }
+
+       /* Call the native function. */
 
-       M_DSEG_BRANCH(funcdisp);
+       disp = dseg_add_functionptr(cd, f);
+       M_DSEG_BRANCH(disp);
 
        /* recompute pv */
        /* TODO: this is only needed because of the tracer ... do we
@@ -3037,7 +3008,7 @@ u1 *createnativestub(functionptr f, jitdata *jd, methoddesc *nmd)
        /* this depends on gcc; it is independent from our ENABLE_SOFTFLOAT define */
        if (md->returntype.type != TYPE_VOID && IS_FLT_DBL_TYPE(md->returntype.type)) {
 #if 0 && !defined(NDEBUG)
-               dolog("NATIVESTUB that returns float or double (%s.%s)", m->class->name->text, m->name->text);
+               dolog("NATIVESTUB that returns float or double (%s.%s)", m->clazz->name->text, m->name->text);
 #endif
                /* we cannot use this macro, since it is not defined in ENABLE_SOFTFLOAT */
                /* M_CAST_FLT_TO_INT_TYPED(md->returntype.type, REG_FRESULT, REG_RESULT_TYPED(md->returntype.type)); */
@@ -3061,7 +3032,8 @@ u1 *createnativestub(functionptr f, jitdata *jd, methoddesc *nmd)
 
        M_STMFD(BITMASK_RESULT, REG_SP);
 
-       M_ADD_IMM(REG_A0, REG_SP, 2*4 + cd->stackframesize * 4 - SIZEOF_VOID_P);
+       M_ADD_IMM(REG_A0, REG_SP, 2*4);
+       M_MOV(REG_A1, REG_PV);
        disp = dseg_add_functionptr(cd, codegen_finish_native_call);
        M_DSEG_BRANCH(disp);
        s1 = (s4) (cd->mcodeptr - cd->mcodebase);
@@ -3070,15 +3042,26 @@ u1 *createnativestub(functionptr f, jitdata *jd, methoddesc *nmd)
        M_MOV(REG_ITMP1_XPTR, REG_RESULT);
        M_LDMFD(BITMASK_RESULT, REG_SP);
 
+#if defined(ENABLE_GC_CACAO)
+       /* restore callee saved int registers from stackframeinfo (GC might have  */
+       /* modified them during a collection).                                    */
+
+       disp = cd->stackframesize - SIZEOF_VOID_P - sizeof(stackframeinfo_t) +
+               OFFSET(stackframeinfo_t, intregs);
+
+       for (i = 0; i < INT_SAV_CNT; i++)
+               M_LDR_INTERN(abi_registers_integer_saved[i], REG_SP, disp + i * 4);
+#endif
+
        /* finish stub code, but do not yet return to caller */
 
-       M_ADD_IMM_EXT_MUL4(REG_SP, REG_SP, cd->stackframesize - 1);
+       M_ADD_IMM_EXT_MUL4(REG_SP, REG_SP, cd->stackframesize / 4 - 1);
        M_LDMFD(1<<REG_LR, REG_SP);
 
        /* check for exception */
 
        M_TST(REG_ITMP1_XPTR, REG_ITMP1_XPTR);
-       M_MOVEQ(REG_PC, REG_LR);            /* if no exception, return to caller  */
+       M_MOVEQ(REG_LR, REG_PC);            /* if no exception, return to caller  */
 
        /* handle exception here */
 
@@ -3087,14 +3070,6 @@ u1 *createnativestub(functionptr f, jitdata *jd, methoddesc *nmd)
        disp = dseg_add_functionptr(cd, asm_handle_nat_exception);
        M_DSEG_LOAD(REG_ITMP3, disp);       /* load asm exception handler address */
        M_MOV(REG_PC, REG_ITMP3);           /* jump to asm exception handler      */
-
-       /* generate patcher stubs */
-
-       emit_patcher_stubs(jd);
-
-       codegen_finish(jd);
-
-       return code->entrypoint;
 }