Split NativeThumb.cpp into NativeThumb.cpp and NativeARM.cpp; no code changes.

Vladimir Vukicevic 2008-09-02 22:29:23 -07:00
parent 420e72ed85
commit 2a520bab9f
3 changed files with 574 additions and 209 deletions


@@ -80,7 +80,7 @@ endif
ifeq ($(CPU_ARCH),arm)
OS_CFLAGS += -DAVMPLUS_ARM -DAVMPLUS_LINUX
NANOJIT_ARCH = Thumb
NANOJIT_ARCH = ARM
endif
GFX_ARCH = x

NativeARM.cpp (new file)

@@ -0,0 +1,573 @@
/* -*- Mode: C++; c-basic-offset: 4; indent-tabs-mode: t; tab-width: 4 -*- */
/* ***** BEGIN LICENSE BLOCK *****
* Version: MPL 1.1/GPL 2.0/LGPL 2.1
*
* The contents of this file are subject to the Mozilla Public License Version
* 1.1 (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
* http://www.mozilla.org/MPL/
*
* Software distributed under the License is distributed on an "AS IS" basis,
* WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
* for the specific language governing rights and limitations under the
* License.
*
* The Original Code is [Open Source Virtual Machine].
*
* The Initial Developer of the Original Code is
* Adobe System Incorporated.
* Portions created by the Initial Developer are Copyright (C) 2004-2007
* the Initial Developer. All Rights Reserved.
*
* Contributor(s):
* Adobe AS3 Team
*
* Alternatively, the contents of this file may be used under the terms of
* either the GNU General Public License Version 2 or later (the "GPL"), or
* the GNU Lesser General Public License Version 2.1 or later (the "LGPL"),
* in which case the provisions of the GPL or the LGPL are applicable instead
* of those above. If you wish to allow use of your version of this file only
* under the terms of either the GPL or the LGPL, and not to allow others to
* use your version of this file under the terms of the MPL, indicate your
* decision by deleting the provisions above and replace them with the notice
* and other provisions required by the GPL or the LGPL. If you do not delete
* the provisions above, a recipient may use your version of this file under
* the terms of any one of the MPL, the GPL or the LGPL.
*
* ***** END LICENSE BLOCK ***** */
#include "nanojit.h"
#ifdef AVMPLUS_PORTING_API
#include "portapi_nanojit.h"
#endif
#ifdef UNDER_CE
#include <cmnintrin.h>
#endif
#if defined(AVMPLUS_LINUX)
#include <asm/unistd.h>
#endif
namespace nanojit
{
#ifdef FEATURE_NANOJIT
#ifdef NJ_VERBOSE
const char* regNames[] = {"r0","r1","r2","r3","r4","r5","r6","r7","r8","r9","r10","r11","IP","SP","LR","PC"};
#endif
const Register Assembler::argRegs[] = { R0, R1, R2, R3 };
const Register Assembler::retRegs[] = { R0, R1 };
void Assembler::nInit(AvmCore*)
{
// all ARMs have conditional move
has_cmov = true;
}
NIns* Assembler::genPrologue(RegisterMask needSaving)
{
/**
* Prologue
*/
// NJ_STACK_OFFSET is space at the top of the stack for us
// to use for parameter passing (8 bytes at the moment)
uint32_t stackNeeded = 4 * _activation.highwatermark + NJ_STACK_OFFSET;
uint32_t savingCount = 0;
uint32_t savingMask = 0;
savingCount = 9; //R4-R10,R11,LR
savingMask = SavedRegs | rmask(FRAME_PTR);
(void)needSaving;
// so for alignment purposes we've pushed return addr, fp, and savingCount registers
uint32_t stackPushed = 4 * (2+savingCount);
uint32_t aligned = alignUp(stackNeeded + stackPushed, NJ_ALIGN_STACK);
int32_t amt = aligned - stackPushed;
// Make room on stack for what we are doing
if (amt)
{
SUBi(SP, amt);
}
verbose_only( verbose_outputf(" %p:",_nIns); )
verbose_only( verbose_output(" patch entry"); )
NIns *patchEntry = _nIns;
MR(FRAME_PTR, SP);
PUSH_mask(savingMask|rmask(LR));
return patchEntry;
}
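// Editor's note: the worked example below is an illustration added for
// clarity and is not part of the original commit.  Assuming hypothetical
// values NJ_STACK_OFFSET == 8, NJ_ALIGN_STACK == 8 and a fragment with
// _activation.highwatermark == 3, the arithmetic above gives:
//
//     stackNeeded = 4*3 + 8            = 20
//     stackPushed = 4 * (2 + 9)        = 44   (return addr, fp, 9 saved regs)
//     aligned     = alignUp(20+44, 8)  = 64
//     amt         = 64 - 44            = 20   -> emitted as SUBi(SP, 20)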
void Assembler::nFragExit(LInsp guard)
{
SideExit* exit = guard->exit();
Fragment *frag = exit->target;
GuardRecord *lr;
if (frag && frag->fragEntry)
{
JMP(frag->fragEntry);
lr = 0;
}
else
{
// target doesn't exist yet. emit jump to epilog, and set up to patch later.
lr = placeGuardRecord(guard);
// we need to know that there's an extra immediate value available
// for us; always force a far jump here.
BL_far(_epilogue);
lr->jmp = _nIns;
}
// pop the stack frame first
MR(SP, FRAME_PTR);
#ifdef NJ_VERBOSE
if (_frago->core()->config.show_stats) {
// load R1 with Fragment *fromFrag, target fragment
// will make use of this when calling fragenter().
int fromfrag = int((Fragment*)_thisfrag);
LDi(argRegs[1], fromfrag);
}
#endif
// return value is GuardRecord*
LDi(R2, int(lr));
}
NIns* Assembler::genEpilogue(RegisterMask restore)
{
BX(LR); // return
MR(R0,R2); // return GuardRecord*
RegisterMask savingMask = restore | rmask(FRAME_PTR) | rmask(LR);
POP_mask(savingMask); // regs
return _nIns;
}
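// Editor's note (not part of the original commit): the assembler emits
// instructions backwards -- each macro writes through *(--_nIns) -- so the
// source order above (BX, MR, POP) is the reverse of execution order.
// The generated epilogue runs roughly as:
//
//     pop  {<restored regs>, fp, lr}   ; POP_mask(savingMask)
//     mov  r0, r2                      ; return value = GuardRecord*
//     bx   lr                          ; return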
void Assembler::asm_call(LInsp ins)
{
const CallInfo* call = callInfoFor(ins->fid());
uint32_t atypes = call->_argtypes;
uint32_t roffset = 0;
// we need to detect if we have arg0 as LO followed by arg1 as F;
// in that case, we need to skip using r1 -- the F needs to be
// loaded in r2/r3, at least according to the ARM EABI and gcc 4.2's
// generated code.
bool arg0IsInt32FollowedByFloat = false;
while ((atypes & 3) != ARGSIZE_NONE) {
if (((atypes >> 4) & 3) == ARGSIZE_LO &&
((atypes >> 2) & 3) == ARGSIZE_F &&
((atypes >> 6) & 3) == ARGSIZE_NONE)
{
arg0IsInt32FollowedByFloat = true;
break;
}
atypes >>= 2;
}
CALL(call);
ArgSize sizes[10];
uint32_t argc = call->get_sizes(sizes);
for(uint32_t i=0; i < argc; i++)
{
uint32_t j = argc - i - 1;
ArgSize sz = sizes[j];
NanoAssert(sz == ARGSIZE_LO || sz == ARGSIZE_Q);
// pre-assign registers R0-R3 for arguments (if they fit)
Register r = (i+roffset) < 4 ? argRegs[i+roffset] : UnknownReg;
asm_arg(sz, ins->arg(j), r);
if (i == 0 && arg0IsInt32FollowedByFloat)
roffset = 1;
}
}
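// Editor's note (illustration added for clarity, not part of the original
// commit): the "int32 followed by float" case above corresponds to a call
// such as the hypothetical
//
//     double foo(int32_t a, double b);
//
// Under the ARM EABI a 64-bit value must start in an even-numbered core
// register, so a lands in r0, r1 is left unused, and b is passed in r2/r3;
// setting roffset = 1 reproduces that skipped register for the remaining
// integer arguments.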
void Assembler::nMarkExecute(Page* page, int32_t count, bool enable)
{
#ifdef UNDER_CE
DWORD dwOld;
VirtualProtect(page, NJ_PAGE_SIZE, PAGE_EXECUTE_READWRITE, &dwOld);
#endif
#ifdef AVMPLUS_PORTING_API
NanoJIT_PortAPI_MarkExecutable(page, (void*)((int32_t)page+count));
#endif
(void)page;
(void)count;
(void)enable;
}
Register Assembler::nRegisterAllocFromSet(int set)
{
// Note: The clz instruction only works on armv5 and up.
#ifndef UNDER_CE
#ifdef __ARMCC__
register int i;
__asm { clz i,set }
Register r = Register(31-i);
_allocator.free &= ~rmask(r);
return r;
#else
// need to implement faster way
int i=0;
while (!(set & rmask((Register)i)))
i ++;
_allocator.free &= ~rmask((Register)i);
return (Register) i;
#endif
#else
Register r;
r = (Register)_CountLeadingZeros(set);
r = (Register)(31-r);
_allocator.free &= ~rmask(r);
return r;
#endif
}
void Assembler::nRegisterResetAll(RegAlloc& a)
{
// add scratch registers to our free list for the allocator
a.clear();
a.used = 0;
a.free = rmask(R0) | rmask(R1) | rmask(R2) | rmask(R3) | rmask(R4) | rmask(R5);
debug_only(a.managed = a.free);
}
void Assembler::nPatchBranch(NIns* branch, NIns* target)
{
// Patch the jump in a loop
// This is ALWAYS going to be a long branch (using the BL instruction)
// Which is really 2 instructions, so we need to modify both
// XXX -- this is B, not BL, at least on non-Thumb..
// branch+2 because PC is always 2 instructions ahead on ARM/Thumb
int32_t offset = int(target) - int(branch+2);
//printf("---patching branch at 0x%08x to location 0x%08x (%d-0x%08x)\n", branch, target, offset, offset);
// We have 2 words to work with here -- if offset is in range of a 24-bit
// relative jump, emit that; otherwise, we do a pc-relative load into pc.
if (-(1<<24) <= offset && offset < (1<<24)) {
// ARM goodness, using unconditional B
*branch = (NIns)( COND_AL | (0xA<<24) | ((offset >>2) & 0xFFFFFF) );
} else {
// LDR pc,[pc]
*branch++ = (NIns)( COND_AL | (0x51<<20) | (PC<<16) | (PC<<12) | ( 0x004 ) );
*branch = (NIns)target;
}
}
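// Editor's note: the helper below is an illustrative sketch added for this
// write-up, not part of the original commit; br_decodeOffset is a
// hypothetical name.  It shows how the short (24-bit) form emitted above
// round-trips back to a byte offset.
static inline int32_t br_decodeOffset(int32_t ins)
{
    int32_t imm24 = ins & 0xFFFFFF;     // low 24 bits hold a signed word offset
    if (imm24 & 0x800000)
        imm24 -= (1 << 24);             // sign-extend from 24 bits
    return imm24 * 4;                   // words -> bytes
}
// For the short form, target == (NIns*)((intptr_t)(branch + 2) + br_decodeOffset((int32_t)*branch)).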
RegisterMask Assembler::hint(LIns* i, RegisterMask allow /* = ~0 */)
{
uint32_t op = i->opcode();
int prefer = ~0;
if (op==LIR_call || op==LIR_fcall)
prefer = rmask(R0);
else if (op == LIR_callh)
prefer = rmask(R1);
else if (op == LIR_param)
prefer = rmask(imm2register(i->imm8()));
if (_allocator.free & allow & prefer)
allow &= prefer;
return allow;
}
void Assembler::asm_qjoin(LIns *ins)
{
int d = findMemFor(ins);
AvmAssert(d);
LIns* lo = ins->oprnd1();
LIns* hi = ins->oprnd2();
Register r = findRegFor(hi, GpRegs);
ST(FP, d+4, r);
// okay if r gets recycled.
r = findRegFor(lo, GpRegs);
ST(FP, d, r);
freeRsrcOf(ins, false); // if we had a reg in use, emit a ST to flush it to mem
}
void Assembler::asm_store32(LIns *value, int dr, LIns *base)
{
// make sure the value and the base are each in a register
Reservation *rA, *rB;
findRegFor2(GpRegs, value, rA, base, rB);
Register ra = rA->reg;
Register rb = rB->reg;
ST(rb, dr, ra);
}
void Assembler::asm_restore(LInsp i, Reservation *resv, Register r)
{
(void)resv;
int d = findMemFor(i);
LD(r, d, FP);
verbose_only(if (_verbose) {
outputf(" restore %s",_thisfrag->lirbuf->names->formatRef(i));
})
}
void Assembler::asm_spill(LInsp i, Reservation *resv, bool pop)
{
(void)i;
(void)pop;
if (resv->arIndex)
{
int d = disp(resv);
// save to spill location
Register rr = resv->reg;
ST(FP, d, rr);
verbose_only(if (_verbose){
outputf(" spill %s",_thisfrag->lirbuf->names->formatRef(i));
})
}
}
void Assembler::asm_load64(LInsp ins)
{
LIns* base = ins->oprnd1();
int db = ins->oprnd2()->constval();
Reservation *resv = getresv(ins);
int dr = disp(resv);
NanoAssert(resv->reg == UnknownReg && dr != 0);
Register rb = findRegFor(base, GpRegs);
resv->reg = UnknownReg;
asm_mmq(FP, dr, rb, db);
freeRsrcOf(ins, false);
}
void Assembler::asm_store64(LInsp value, int dr, LInsp base)
{
int da = findMemFor(value);
Register rb = findRegFor(base, GpRegs);
asm_mmq(rb, dr, FP, da);
}
void Assembler::asm_quad(LInsp ins)
{
Reservation *rR = getresv(ins);
int d = disp(rR);
freeRsrcOf(ins, false);
if (d)
{
const int32_t* p = (const int32_t*) (ins-2);
STi(FP,d+4,p[1]);
STi(FP,d,p[0]);
}
}
bool Assembler::asm_qlo(LInsp ins, LInsp q)
{
(void)ins; (void)q;
return false;
}
void Assembler::asm_nongp_copy(Register r, Register s)
{
// we will need this for VFP support
(void)r; (void)s;
NanoAssert(false);
}
Register Assembler::asm_binop_rhs_reg(LInsp ins)
{
return UnknownReg;
}
/**
* copy 64 bits: (rd+dd) <- (rs+ds)
*/
void Assembler::asm_mmq(Register rd, int dd, Register rs, int ds)
{
// value is either a 64bit struct or maybe a float
// that isn't live in an FPU reg. Either way, don't
// put it in an FPU reg just to load & store it.
// get a scratch reg
Register t = registerAlloc(GpRegs & ~(rmask(rd)|rmask(rs)));
_allocator.addFree(t);
ST(rd, dd+4, t);
LD(t, ds+4, rs);
ST(rd, dd, t);
LD(t, ds, rs);
}
void Assembler::asm_pusharg(LInsp p)
{
// arg goes on stack
Reservation* rA = getresv(p);
if (rA == 0)
{
Register ra = findRegFor(p, GpRegs);
ST(SP,0,ra);
}
else if (rA->reg == UnknownReg)
{
ST(SP,0,Scratch);
LD(Scratch,disp(rA),FP);
}
else
{
ST(SP,0,rA->reg);
}
}
void Assembler::nativePageReset()
{
_nSlot = 0;
_nExitSlot = 0;
}
void Assembler::nativePageSetup()
{
if (!_nIns) _nIns = pageAlloc();
if (!_nExitIns) _nExitIns = pageAlloc(true);
//fprintf(stderr, "assemble onto %x exits into %x\n", (int)_nIns, (int)_nExitIns);
if (!_nSlot)
{
// This needs to be done or the samepage macro gets confused; pageAlloc
// gives us a pointer to just past the end of the page.
_nIns--;
_nExitIns--;
// the constant pool starts just past the page header and grows up,
// while code starts at the top of the page and is emitted downwards
_nSlot = pageDataStart(_nIns); //(int*)(&((Page*)pageTop(_nIns))->lir[0]);
}
}
void Assembler::flushCache(NIns* n1, NIns* n2) {
#if defined(UNDER_CE)
// we changed the code, so we need to do this (sadly)
FlushInstructionCache(GetCurrentProcess(), NULL, NULL);
#elif defined(AVMPLUS_LINUX)
// Just need to clear this one page (not even the whole page really)
//Page *page = (Page*)pageTop(_nIns);
register unsigned long _beg __asm("a1") = (unsigned long)(n1);
register unsigned long _end __asm("a2") = (unsigned long)(n2);
register unsigned long _flg __asm("a3") = 0;
register unsigned long _swi __asm("r7") = 0xF0002;
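// (editor's note: 0xF0002 is the ARM-private cacheflush syscall,
// __ARM_NR_cacheflush from <asm/unistd.h>; arguments are start, end, flags)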
__asm __volatile ("swi 0 @ sys_cacheflush" : "=r" (_beg) : "0" (_beg), "r" (_end), "r" (_flg), "r" (_swi));
#endif
}
NIns* Assembler::asm_adjustBranch(NIns* at, NIns* target)
{
// This always got emitted as a BL_far sequence; at points
// to the first of 4 instructions. Ensure that we're where
// we think we were..
NanoAssert(at[1] == (NIns)( COND_AL | OP_IMM | (1<<23) | (PC<<16) | (LR<<12) | (4) ));
NanoAssert(at[2] == (NIns)( COND_AL | (0x9<<21) | (0xFFF<<8) | (1<<4) | (IP) ));
NIns* was = (NIns*) at[3];
at[3] = (NIns)target;
flushCache(at, at+4);
#ifdef AVMPLUS_PORTING_API
NanoJIT_PortAPI_FlushInstructionCache(at, at+4);
#endif
return was;
}
void Assembler::underrunProtect(int bytes)
{
intptr_t u = bytes + sizeof(PageHeader)/sizeof(NIns) + 8;
if ( (samepage(_nIns,_nSlot) && (((intptr_t)_nIns-u) <= intptr_t(_nSlot+1))) ||
(!samepage((intptr_t)_nIns-u,_nIns)) )
{
NIns* target = _nIns;
_nIns = pageAlloc(_inExit);
// XXX _nIns at this point points to one past the end of
// the page, intended to be written into using *(--_nIns).
// However, (guess) something seems to be storing the value
// of _nIns as is, and then later generating a jump to a bogus
// address. So pre-decrement to ensure that it's always
// valid; we end up skipping using the last instruction this
// way.
_nIns--;
// Update slot, either to _nIns (if decremented above), or
// _nIns-1 once the above bug is fixed/found.
_nSlot = pageDataStart(_nIns);
// If samepage() is used on _nIns and _nSlot, it'll fail, since _nIns
// points to one past the end of the page right now. Assume that
// JMP_nochk won't ever try to write to _nSlot, and so won't ever
// check samepage(). See B_cond_chk macro.
JMP_nochk(target);
} else if (!_nSlot) {
// make sure that there's always a slot pointer
_nSlot = pageDataStart(_nIns);
}
}
void Assembler::BL_far(NIns* addr) {
// we have to stick an immediate into the stream and make lr
// point to the right spot before branching
underrunProtect(16);
// the address
*(--_nIns) = (NIns)((addr));
// bx ip // branch to the address we loaded earlier
*(--_nIns) = (NIns)( COND_AL | (0x9<<21) | (0xFFF<<8) | (1<<4) | (IP) );
// add lr, pc, #4 // set lr to be past the address that we wrote
*(--_nIns) = (NIns)( COND_AL | OP_IMM | (1<<23) | (PC<<16) | (LR<<12) | (4) );
// ldr ip, [pc + #4] // load the address into ip, reading it from [pc+4]
*(--_nIns) = (NIns)( COND_AL | (0x59<<20) | (PC<<16) | (IP<<12) | (4));
asm_output1("bl %p (32-bit)", addr);
}
void Assembler::BL(NIns* addr) {
intptr_t offs = PC_OFFSET_FROM(addr,(intptr_t)_nIns-4);
if (JMP_S24_OFFSET_OK(offs)) {
// we can do this with a single BL call
underrunProtect(4);
*(--_nIns) = (NIns)( COND_AL | (0xB<<24) | (((offs)>>2) & 0xFFFFFF) );
asm_output1("bl %p", addr);
} else {
BL_far(addr);
}
}
void Assembler::CALL(const CallInfo *ci)
{
intptr_t addr = ci->_address;
BL((NIns*)addr);
asm_output1(" (call %s)", ci->_name);
}
void Assembler::LD32_nochk(Register r, int32_t imm)
{
// We can always reach the const pool, since it's on the same page (<4096)
underrunProtect(8);
*(++_nSlot) = (int)imm;
//fprintf (stderr, "wrote slot(2) %p with %08x, jmp @ %p\n", _nSlot, (intptr_t)imm, _nIns-1);
int offset = PC_OFFSET_FROM(_nSlot,(intptr_t)(_nIns)-4);
NanoAssert(JMP_S24_OFFSET_OK(offset) && (offset < 0));
*(--_nIns) = (NIns)( COND_AL | (0x51<<20) | (PC<<16) | ((r)<<12) | ((-offset) & 0xFFFFFF) );
asm_output2("ld %s,%d",gpn(r),imm);
}
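// Editor's note (illustration, not part of the original commit): the store
// into *_nSlot plus the load emitted above form a pc-relative constant-pool
// reference, roughly:
//
//     ldr r, [pc, #-disp]    ; disp = distance back from pc to the pool slot
//     ...
//     .word imm              ; the slot written via *(++_nSlot)
//
// The NanoAssert requires a negative displacement (the pool entry sits
// behind the load instruction) and, because pool and code share one page,
// the distance always fits in the LDR immediate field.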
#endif /* FEATURE_NANOJIT */
}

NativeThumb.cpp

@@ -63,13 +63,8 @@ namespace nanojit
void Assembler::nInit(AvmCore*)
{
#ifdef NJ_THUMB_JIT
// Thumb mode does not have conditional move, alas
has_cmov = false;
#else
// all ARMs have conditional move
has_cmov = true;
#endif
}
NIns* Assembler::genPrologue(RegisterMask needSaving)
@@ -84,15 +79,9 @@ namespace nanojit
uint32_t savingCount = 0;
uint32_t savingMask = 0;
#if defined(NJ_THUMB_JIT)
savingCount = 5; // R4-R7, LR
savingMask = 0xF0;
(void)needSaving;
#else
savingCount = 9; //R4-R10,R11,LR
savingMask = SavedRegs | rmask(FRAME_PTR);
(void)needSaving;
#endif
// so for alignment purposes we've pushed return addr, fp, and savingCount registers
uint32_t stackPushed = 4 * (2+savingCount);
@@ -101,7 +90,6 @@ namespace nanojit
// Make room on stack for what we are doing
if (amt)
#ifdef NJ_THUMB_JIT
{
// largest value is 508 (7-bits << 2)
if (amt>508)
@@ -120,11 +108,6 @@ namespace nanojit
SUBi(SP, amt);
}
#else
{
SUBi(SP, amt);
}
#endif
verbose_only( verbose_outputf(" %p:",_nIns); )
verbose_only( verbose_output(" patch entry"); )
NIns *patchEntry = _nIns;
@@ -149,13 +132,7 @@ namespace nanojit
// target doesn't exist yet. emit jump to epilog, and set up to patch later.
lr = placeGuardRecord(guard);
#ifdef NJ_THUMB_JIT
BL(_epilogue);
#else
// we need to know that there's an extra immediate value available
// for us; always force a far jump here.
BL_far(_epilogue);
#endif
lr->jmp = _nIns;
}
@@ -178,7 +155,6 @@ namespace nanojit
NIns* Assembler::genEpilogue(RegisterMask restore)
{
#ifdef NJ_THUMB_JIT
(void)restore;
if (false) {
// interworking
@@ -191,13 +167,6 @@ namespace nanojit
}
MR(R0,R2); // return GuardRecord*
return _nIns;
#else
BX(LR); // return
MR(R0,R2); // return LinkRecord*
RegisterMask savingMask = restore | rmask(FRAME_PTR) | rmask(LR);
POP_mask(savingMask); // regs
return _nIns;
#endif
}
void Assembler::asm_call(LInsp ins)
@@ -255,40 +224,12 @@ namespace nanojit
Register Assembler::nRegisterAllocFromSet(int set)
{
#ifdef NJ_THUMB_JIT
// need to implement faster way
int i=0;
while (!(set & rmask((Register)i)))
i ++;
_allocator.free &= ~rmask((Register)i);
return (Register) i;
#else
// Note: The clz instruction only works on armv5 and up.
#ifndef UNDER_CE
#ifdef __ARMCC__
register int i;
__asm { clz i,set }
Register r = Register(31-i);
_allocator.free &= ~rmask(r);
return r;
#else
// need to implement faster way
int i=0;
while (!(set & rmask((Register)i)))
i ++;
_allocator.free &= ~rmask((Register)i);
return (Register) i;
#endif
#else
Register r;
r = (Register)_CountLeadingZeros(set);
r = (Register)(31-r);
_allocator.free &= ~rmask(r);
return r;
#endif
#endif
}
void Assembler::nRegisterResetAll(RegAlloc& a)
@@ -313,22 +254,9 @@ namespace nanojit
//printf("---patching branch at 0x%08x to location 0x%08x (%d-0x%08x)\n", branch, target, offset, offset);
#ifdef NJ_THUMB_JIT
NanoAssert(-(1<<21) <= offset && offset < (1<<21));
*branch++ = (NIns)(0xF000 | (offset>>12)&0x7FF);
*branch = (NIns)(0xF800 | (offset>>1)&0x7FF);
#else
// We have 2 words to work with here -- if offset is in range of a 24-bit
// relative jump, emit that; otherwise, we do a pc-relative load into pc.
if (-(1<<24) <= offset && offset < (1<<24)) {
// ARM goodness, using unconditional B
*branch = (NIns)( COND_AL | (0xA<<24) | ((offset >>2) & 0xFFFFFF) );
} else {
// LDR pc,[pc]
*branch++ = (NIns)( COND_AL | (0x51<<20) | (PC<<16) | (PC<<12) | ( 0x004 ) );
*branch = (NIns)target;
}
#endif
}
RegisterMask Assembler::hint(LIns* i, RegisterMask allow /* = ~0 */)
@@ -491,15 +419,10 @@ namespace nanojit
void Assembler::nativePageReset()
{
#ifdef NJ_THUMB_JIT
_nPool = 0;
_nSlot = 0;
_nExitPool = 0;
_nExitSlot = 0;
#else
_nSlot = 0;
_nExitSlot = 0;
#endif
}
void Assembler::nativePageSetup()
@@ -508,7 +431,6 @@ namespace nanojit
if (!_nExitIns) _nExitIns = pageAlloc(true);
//fprintf(stderr, "assemble onto %x exits into %x\n", (int)_nIns, (int)_nExitIns);
#ifdef NJ_THUMB_JIT
if (!_nPool) {
_nSlot = _nPool = (int*)_nIns;
@@ -525,19 +447,6 @@ namespace nanojit
// no branch needed since this follows the epilogue
}
#else
if (!_nSlot)
{
// This needs to be done or the samepage macro gets confused; pageAlloc
// gives us a pointer to just past the end of the page.
_nIns--;
_nExitIns--;
// constpool starts at top of page and goes down,
// code starts at bottom of page and moves up
_nSlot = pageDataStart(_nIns); //(int*)(&((Page*)pageTop(_nIns))->lir[0]);
}
#endif
}
void Assembler::flushCache(NIns* n1, NIns* n2) {
@@ -555,8 +464,6 @@ namespace nanojit
#endif
}
#ifdef NJ_THUMB_JIT
NIns* Assembler::asm_adjustBranch(NIns* at, NIns* target)
{
NIns* save = _nIns;
@@ -896,104 +803,8 @@ namespace nanojit
}
}
#else // ARM_JIT
NIns* Assembler::asm_adjustBranch(NIns* at, NIns* target)
{
// This always got emitted as a BL_far sequence; at points
// to the first of 4 instructions. Ensure that we're where
// we think we were..
NanoAssert(at[1] == (NIns)( COND_AL | OP_IMM | (1<<23) | (PC<<16) | (LR<<12) | (4) ));
NanoAssert(at[2] == (NIns)( COND_AL | (0x9<<21) | (0xFFF<<8) | (1<<4) | (IP) ));
NIns* was = (NIns*) at[3];
at[3] = (NIns)target;
flushCache(at, at+4);
#ifdef AVMPLUS_PORTING_API
NanoJIT_PortAPI_FlushInstructionCache(at, at+4);
#endif
return was;
}
void Assembler::underrunProtect(int bytes)
{
intptr_t u = bytes + sizeof(PageHeader)/sizeof(NIns) + 8;
if ( (samepage(_nIns,_nSlot) && (((intptr_t)_nIns-u) <= intptr_t(_nSlot+1))) ||
(!samepage((intptr_t)_nIns-u,_nIns)) )
{
NIns* target = _nIns;
_nIns = pageAlloc(_inExit);
// XXX _nIns at this point points to one past the end of
// the page, intended to be written into using *(--_nIns).
// However, (guess) something seems to be storing the value
// of _nIns as is, and then later generating a jump to a bogus
// address. So pre-decrement to ensure that it's always
// valid; we end up skipping using the last instruction this
// way.
_nIns--;
// Update slot, either to _nIns (if decremented above), or
// _nIns-1 once the above bug is fixed/found.
_nSlot = pageDataStart(_nIns);
// If samepage() is used on _nIns and _nSlot, it'll fail, since _nIns
// points to one past the end of the page right now. Assume that
// JMP_nochk won't ever try to write to _nSlot, and so won't ever
// check samepage(). See B_cond_chk macro.
JMP_nochk(target);
} else if (!_nSlot) {
// make sure that there's always a slot pointer
_nSlot = pageDataStart(_nIns);
}
}
void Assembler::BL_far(NIns* addr) {
// we have to stick an immediate into the stream and make lr
// point to the right spot before branching
underrunProtect(16);
// the address
*(--_nIns) = (NIns)((addr));
// bx ip // branch to the address we loaded earlier
*(--_nIns) = (NIns)( COND_AL | (0x9<<21) | (0xFFF<<8) | (1<<4) | (IP) );
// add lr, [pc + #4] // set lr to be past the address that we wrote
*(--_nIns) = (NIns)( COND_AL | OP_IMM | (1<<23) | (PC<<16) | (LR<<12) | (4) );
// ldr ip, [pc + #4] // load the address into ip, reading it from [pc+4]
*(--_nIns) = (NIns)( COND_AL | (0x59<<20) | (PC<<16) | (IP<<12) | (4));
asm_output1("bl %p (32-bit)", addr);
}
void Assembler::BL(NIns* addr) {
intptr_t offs = PC_OFFSET_FROM(addr,(intptr_t)_nIns-4);
if (JMP_S24_OFFSET_OK(offs)) {
// we can do this with a single BL call
underrunProtect(4);
*(--_nIns) = (NIns)( COND_AL | (0xB<<24) | (((offs)>>2) & 0xFFFFFF) ); \
asm_output1("bl %p", addr);
} else {
BL_far(addr);
}
}
void Assembler::CALL(const CallInfo *ci)
{
intptr_t addr = ci->_address;
BL((NIns*)addr);
asm_output1(" (call %s)", ci->_name);
}
#endif // NJ_THUMB_JIT
void Assembler::LD32_nochk(Register r, int32_t imm)
{
#ifdef NJ_THUMB_JIT
// Can we reach the current slot/pool?
int offset = (int)(_nSlot) - (int)(_nIns);
if ((offset>=NJ_MAX_CPOOL_OFFSET || offset<0) ||
@@ -1023,25 +834,6 @@ namespace nanojit
int data_off = int(data) - (int(_nIns+1)&~3);
*(--_nIns) = (NIns)(0x4800 | r<<8 | data_off>>2);
asm_output3("ldr %s,%d(PC) [%X]",gpn(r),data_off,(int)data);
#else
// We can always reach the const pool, since it's on the same page (<4096)
underrunProtect(8);
*(++_nSlot) = (int)imm;
//fprintf (stderr, "wrote slot(2) %p with %08x, jmp @ %p\n", _nSlot, (intptr_t)imm, _nIns-1);
int offset = PC_OFFSET_FROM(_nSlot,(intptr_t)(_nIns)-4);
NanoAssert(JMP_S24_OFFSET_OK(offset) && (offset < 0));
*(--_nIns) = (NIns)( COND_AL | (0x51<<20) | (PC<<16) | ((r)<<12) | ((-offset) & 0xFFFFFF) );
asm_output2("ld %s,%d",gpn(r),imm);
#endif
}
#endif /* FEATURE_NANOJIT */
}