vm/compiler/codegen/mips/Mips32/Gen.cpp - platform/dalvik - Git at Google

 /*
  * Copyright (C) 2009 The Android Open Source Project
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
  * You may obtain a copy of the License at
  *
  *      http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */

 /*
  * This file contains codegen for the Mips ISA and is intended to be
  * includes by:
  *
  *        Codegen-$(TARGET_ARCH_VARIANT).c
  *
  */

 /*
  * Reserve 8 bytes at the beginning of the trace
  *        +----------------------------+
  *        | prof count addr (4 bytes)  |
  *        +----------------------------+
  *        | chain cell offset (4 bytes)|
  *        +----------------------------+
  *
  * ...and then code to increment the execution
  *
  * For continuous profiling (24 bytes)
  *       lahi  a0, addr    # get ptr to prof count addr into a0
  *       lalo  a0, addr
  *       lw    a0, 0(a0)   # read prof count addr into a0
  *       lw    a1, 0(a0)   # read prof count into a1
  *       addiu a1, a1, 1   # increment count
  *       sw    a1, 0(a0)   # store count
  *
  * For periodic profiling (8 bytes)
  *       call  TEMPLATE_PERIODIC_PROFILING
  *       nop
  *
  * and return the size (in bytes) of the generated code.
  */
 static int genTraceProfileEntry(CompilationUnit *cUnit)
 {
     intptr_t addr = (intptr_t)dvmJitNextTraceCounter();
     assert(__BYTE_ORDER == __LITTLE_ENDIAN);
     MipsLIR *executionCount = newLIR1(cUnit, kMips32BitData, addr);
     cUnit->chainCellOffsetLIR =
         (LIR *) newLIR1(cUnit, kMips32BitData, CHAIN_CELL_OFFSET_TAG);
     cUnit->headerSize = 8;
     if ((gDvmJit.profileMode == kTraceProfilingContinuous) ||
         (gDvmJit.profileMode == kTraceProfilingDisabled)) {
         MipsLIR *loadAddr = newLIR2(cUnit, kMipsLahi, r_A0, 0);
         loadAddr->generic.target = (LIR *) executionCount;
         loadAddr = newLIR3(cUnit, kMipsLalo, r_A0, r_A0, 0);
         loadAddr ->generic.target = (LIR *) executionCount;
         newLIR3(cUnit, kMipsLw, r_A0, 0, r_A0);
         newLIR3(cUnit, kMipsLw, r_A1, 0, r_A0);
         newLIR3(cUnit, kMipsAddiu, r_A1, r_A1, 1);
         newLIR3(cUnit, kMipsSw, r_A1, 0, r_A0);
         return 24;
     } else {
         int opcode = TEMPLATE_PERIODIC_PROFILING;
         newLIR1(cUnit, kMipsJal,
             (int) gDvmJit.codeCache + templateEntryOffsets[opcode]);
         newLIR0(cUnit, kMipsNop); /* delay slot */
         return 8;
     }
 }

 /*
  * Perform a "reg cmp imm" operation and jump to the PCR region if condition
  * satisfies.
  */
 static void genNegFloat(CompilationUnit *cUnit, RegLocation rlDest,
                         RegLocation rlSrc)
 {
     RegLocation rlResult;
     rlSrc = loadValue(cUnit, rlSrc, kCoreReg);
     rlResult = dvmCompilerEvalLoc(cUnit, rlDest, kCoreReg, true);
     opRegRegImm(cUnit, kOpAdd, rlResult.lowReg,
                 rlSrc.lowReg, 0x80000000);
     storeValue(cUnit, rlDest, rlResult);
 }

 static void genNegDouble(CompilationUnit *cUnit, RegLocation rlDest,
                          RegLocation rlSrc)
 {
     RegLocation rlResult;
     rlSrc = loadValueWide(cUnit, rlSrc, kCoreReg);
     rlResult = dvmCompilerEvalLoc(cUnit, rlDest, kCoreReg, true);
     opRegRegImm(cUnit, kOpAdd, rlResult.highReg, rlSrc.highReg,
                         0x80000000);
     genRegCopy(cUnit, rlResult.lowReg, rlSrc.lowReg);
     storeValueWide(cUnit, rlDest, rlResult);
 }

 static void genMulLong(CompilationUnit *cUnit, RegLocation rlDest,
                        RegLocation rlSrc1, RegLocation rlSrc2)
 {
     RegLocation rlResult;
     loadValueDirectWideFixed(cUnit, rlSrc1, r_ARG0, r_ARG1);
     loadValueDirectWideFixed(cUnit, rlSrc2, r_ARG2, r_ARG3);
     genDispatchToHandler(cUnit, TEMPLATE_MUL_LONG);
     rlResult = dvmCompilerGetReturnWide(cUnit);
     storeValueWide(cUnit, rlDest, rlResult);
 }

 static bool partialOverlap(int sreg1, int sreg2)
 {
     return abs(sreg1 - sreg2) == 1;
 }

 static void withCarryHelper(CompilationUnit *cUnit, MipsOpCode opc,
                             RegLocation rlDest, RegLocation rlSrc1,
                             RegLocation rlSrc2, int sltuSrc1, int sltuSrc2)
 {
     int tReg = dvmCompilerAllocTemp(cUnit);
     newLIR3(cUnit, opc, rlDest.lowReg, rlSrc1.lowReg, rlSrc2.lowReg);
     newLIR3(cUnit, kMipsSltu, tReg, sltuSrc1, sltuSrc2);
     newLIR3(cUnit, opc, rlDest.highReg, rlSrc1.highReg, rlSrc2.highReg);
     newLIR3(cUnit, opc, rlDest.highReg, rlDest.highReg, tReg);
     dvmCompilerFreeTemp(cUnit, tReg);
 }

 static void genLong3Addr(CompilationUnit *cUnit, MIR *mir, OpKind firstOp,
                          OpKind secondOp, RegLocation rlDest,
                          RegLocation rlSrc1, RegLocation rlSrc2)
 {
     RegLocation rlResult;
     int carryOp = (secondOp == kOpAdc || secondOp == kOpSbc);

     if (partialOverlap(rlSrc1.sRegLow,rlSrc2.sRegLow) ||
         partialOverlap(rlSrc1.sRegLow,rlDest.sRegLow) ||
         partialOverlap(rlSrc2.sRegLow,rlDest.sRegLow)) {
         // Rare case - not enough registers to properly handle
         genInterpSingleStep(cUnit, mir);
     } else if (rlDest.sRegLow == rlSrc1.sRegLow) {
         rlResult = loadValueWide(cUnit, rlDest, kCoreReg);
         rlSrc2 = loadValueWide(cUnit, rlSrc2, kCoreReg);
         if (!carryOp) {
             opRegRegReg(cUnit, firstOp, rlResult.lowReg, rlResult.lowReg, rlSrc2.lowReg);
             opRegRegReg(cUnit, secondOp, rlResult.highReg, rlResult.highReg, rlSrc2.highReg);
         } else if (secondOp == kOpAdc) {
             withCarryHelper(cUnit, kMipsAddu, rlResult, rlResult, rlSrc2,
                             rlResult.lowReg, rlSrc2.lowReg);
         } else {
             int tReg = dvmCompilerAllocTemp(cUnit);
             newLIR2(cUnit, kMipsMove, tReg, rlResult.lowReg);
             withCarryHelper(cUnit, kMipsSubu, rlResult, rlResult, rlSrc2,
                             tReg, rlResult.lowReg);
             dvmCompilerFreeTemp(cUnit, tReg);
         }
         storeValueWide(cUnit, rlDest, rlResult);
     } else if (rlDest.sRegLow == rlSrc2.sRegLow) {
         rlResult = loadValueWide(cUnit, rlDest, kCoreReg);
         rlSrc1 = loadValueWide(cUnit, rlSrc1, kCoreReg);
         if (!carryOp) {
             opRegRegReg(cUnit, firstOp, rlResult.lowReg, rlSrc1.lowReg, rlResult.lowReg);
             opRegRegReg(cUnit, secondOp, rlResult.highReg, rlSrc1.highReg, rlResult.highReg);
         } else if (secondOp == kOpAdc) {
             withCarryHelper(cUnit, kMipsAddu, rlResult, rlSrc1, rlResult,
                             rlResult.lowReg, rlSrc1.lowReg);
         } else {
             withCarryHelper(cUnit, kMipsSubu, rlResult, rlSrc1, rlResult,
                             rlSrc1.lowReg, rlResult.lowReg);
         }
         storeValueWide(cUnit, rlDest, rlResult);
     } else {
         rlSrc1 = loadValueWide(cUnit, rlSrc1, kCoreReg);
         rlSrc2 = loadValueWide(cUnit, rlSrc2, kCoreReg);
         rlResult = dvmCompilerEvalLoc(cUnit, rlDest, kCoreReg, true);
         if (!carryOp) {
             opRegRegReg(cUnit, firstOp, rlResult.lowReg, rlSrc1.lowReg, rlSrc2.lowReg);
             opRegRegReg(cUnit, secondOp, rlResult.highReg, rlSrc1.highReg, rlSrc2.highReg);
         } else if (secondOp == kOpAdc) {
             withCarryHelper(cUnit, kMipsAddu, rlResult, rlSrc1, rlSrc2,
                             rlResult.lowReg, rlSrc1.lowReg);
         } else {
             withCarryHelper(cUnit, kMipsSubu, rlResult, rlSrc1, rlSrc2,
                             rlSrc1.lowReg, rlResult.lowReg);
         }
         storeValueWide(cUnit, rlDest, rlResult);
     }
 }

 void dvmCompilerInitializeRegAlloc(CompilationUnit *cUnit)
 {
     int numTemps = sizeof(coreTemps)/sizeof(int);
     RegisterPool *pool = (RegisterPool *) dvmCompilerNew(sizeof(*pool), true);
     cUnit->regPool = pool;
     pool->numCoreTemps = numTemps;
     pool->coreTemps =
             (RegisterInfo *) dvmCompilerNew(numTemps * sizeof(*pool->coreTemps), true);
     dvmCompilerInitPool(pool->coreTemps, coreTemps, pool->numCoreTemps);
 #ifdef __mips_hard_float
     int numFPTemps = sizeof(fpTemps)/sizeof(int);
     pool->numFPTemps = numFPTemps;
     pool->FPTemps =
             (RegisterInfo *) dvmCompilerNew(numFPTemps * sizeof(*pool->FPTemps), true);
     dvmCompilerInitPool(pool->FPTemps, fpTemps, pool->numFPTemps);
 #else
     pool->numFPTemps = 0;
     pool->FPTemps = NULL;
     dvmCompilerInitPool(pool->FPTemps, NULL, 0);
 #endif
     pool->nullCheckedRegs =
         dvmCompilerAllocBitVector(cUnit->numSSARegs, false);
 }

 /* Export the Dalvik PC assicated with an instruction to the StackSave area */
 static MipsLIR *genExportPC(CompilationUnit *cUnit, MIR *mir)
 {
     MipsLIR *res;
     int rDPC = dvmCompilerAllocTemp(cUnit);
     int rAddr = dvmCompilerAllocTemp(cUnit);
     int offset = offsetof(StackSaveArea, xtra.currentPc);
     res = loadConstant(cUnit, rDPC, (int) (cUnit->method->insns + mir->offset));
     newLIR3(cUnit, kMipsAddiu, rAddr, rFP, -(sizeof(StackSaveArea) - offset));
     storeWordDisp( cUnit, rAddr, 0, rDPC);
     return res;
 }

 static void genMonitor(CompilationUnit *cUnit, MIR *mir)
 {
     genMonitorPortable(cUnit, mir);
 }

 static void genCmpLong(CompilationUnit *cUnit, MIR *mir, RegLocation rlDest,
                        RegLocation rlSrc1, RegLocation rlSrc2)
 {
     RegLocation rlResult;
     loadValueDirectWideFixed(cUnit, rlSrc1, r_ARG0, r_ARG1);
     loadValueDirectWideFixed(cUnit, rlSrc2, r_ARG2, r_ARG3);
     genDispatchToHandler(cUnit, TEMPLATE_CMP_LONG);
     rlResult = dvmCompilerGetReturn(cUnit);
     storeValue(cUnit, rlDest, rlResult);
 }

 static bool genInlinedAbsFloat(CompilationUnit *cUnit, MIR *mir)
 {
     int offset = offsetof(Thread, interpSave.retval);
     RegLocation rlSrc = dvmCompilerGetSrc(cUnit, mir, 0);
     int reg0 = loadValue(cUnit, rlSrc, kCoreReg).lowReg;
 #if __mips_isa_rev>=2
     newLIR4(cUnit, kMipsExt, reg0, reg0, 0, 31-1 /* size-1 */);
 #else
     newLIR2(cUnit, kMipsSll, reg0, 1);
     newLIR2(cUnit, kMipsSrl, reg0, 1);
 #endif
     storeWordDisp(cUnit, rSELF, offset, reg0);
     //TUNING: rewrite this to not clobber
     dvmCompilerClobber(cUnit, reg0);
     return false;
 }

 static bool genInlinedAbsDouble(CompilationUnit *cUnit, MIR *mir)
 {
     int offset = offsetof(Thread, interpSave.retval);
     RegLocation rlSrc = dvmCompilerGetSrcWide(cUnit, mir, 0, 1);
     RegLocation regSrc = loadValueWide(cUnit, rlSrc, kCoreReg);
     int reglo = regSrc.lowReg;
     int reghi = regSrc.highReg;
     storeWordDisp(cUnit, rSELF, offset + LOWORD_OFFSET, reglo);
 #if __mips_isa_rev>=2
     newLIR4(cUnit, kMipsExt, reghi, reghi, 0, 31-1 /* size-1 */);
 #else
     newLIR2(cUnit, kMipsSll, reghi, 1);
     newLIR2(cUnit, kMipsSrl, reghi, 1);
 #endif
     storeWordDisp(cUnit, rSELF, offset + HIWORD_OFFSET, reghi);
     //TUNING: rewrite this to not clobber
     dvmCompilerClobber(cUnit, reghi);
     return false;
 }

 /* No select in thumb, so we need to branch.  Thumb2 will do better */
 static bool genInlinedMinMaxInt(CompilationUnit *cUnit, MIR *mir, bool isMin)
 {
     int offset = offsetof(Thread, interpSave.retval);
     RegLocation rlSrc1 = dvmCompilerGetSrc(cUnit, mir, 0);
     RegLocation rlSrc2 = dvmCompilerGetSrc(cUnit, mir, 1);
     int reg0 = loadValue(cUnit, rlSrc1, kCoreReg).lowReg;
     int reg1 = loadValue(cUnit, rlSrc2, kCoreReg).lowReg;
     int tReg = dvmCompilerAllocTemp(cUnit);
     if (isMin) {
        newLIR3(cUnit, kMipsSlt, tReg, reg0, reg1);
     }
     else {
        newLIR3(cUnit, kMipsSlt, tReg, reg1, reg0);
     }
     newLIR3(cUnit, kMipsMovz, reg0, reg1, tReg);
     dvmCompilerFreeTemp(cUnit, tReg);
     newLIR3(cUnit, kMipsSw, reg0, offset, rSELF);
     //TUNING: rewrite this to not clobber
     dvmCompilerClobber(cUnit,reg0);
     return false;
 }

 static void genMultiplyByTwoBitMultiplier(CompilationUnit *cUnit,
         RegLocation rlSrc, RegLocation rlResult, int lit,
         int firstBit, int secondBit)
 {
     // We can't implement "add src, src, src, lsl#shift" on Thumb, so we have
     // to do a regular multiply.
     opRegRegImm(cUnit, kOpMul, rlResult.lowReg, rlSrc.lowReg, lit);
 }
	/*
	* Copyright (C) 2009 The Android Open Source Project
	*
	* Licensed under the Apache License, Version 2.0 (the "License");
	* you may not use this file except in compliance with the License.
	* You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/

	/*
	* This file contains codegen for the Mips ISA and is intended to be
	* includes by:
	*
	* Codegen-$(TARGET_ARCH_VARIANT).c
	*
	*/

	/*
	* Reserve 8 bytes at the beginning of the trace
	* +----------------------------+
	* \| prof count addr (4 bytes) \|
	* +----------------------------+
	* \| chain cell offset (4 bytes)\|
	* +----------------------------+
	*
	* ...and then code to increment the execution
	*
	* For continuous profiling (24 bytes)
	* lahi a0, addr # get ptr to prof count addr into a0
	* lalo a0, addr
	* lw a0, 0(a0) # read prof count addr into a0
	* lw a1, 0(a0) # read prof count into a1
	* addiu a1, a1, 1 # increment count
	* sw a1, 0(a0) # store count
	*
	* For periodic profiling (8 bytes)
	* call TEMPLATE_PERIODIC_PROFILING
	* nop
	*
	* and return the size (in bytes) of the generated code.
	*/
	static int genTraceProfileEntry(CompilationUnit *cUnit)
	{
	intptr_t addr = (intptr_t)dvmJitNextTraceCounter();
	assert(__BYTE_ORDER == __LITTLE_ENDIAN);
	MipsLIR *executionCount = newLIR1(cUnit, kMips32BitData, addr);
	cUnit->chainCellOffsetLIR =
	(LIR *) newLIR1(cUnit, kMips32BitData, CHAIN_CELL_OFFSET_TAG);
	cUnit->headerSize = 8;
	if ((gDvmJit.profileMode == kTraceProfilingContinuous) \|\|
	(gDvmJit.profileMode == kTraceProfilingDisabled)) {
	MipsLIR *loadAddr = newLIR2(cUnit, kMipsLahi, r_A0, 0);
	loadAddr->generic.target = (LIR *) executionCount;
	loadAddr = newLIR3(cUnit, kMipsLalo, r_A0, r_A0, 0);
	loadAddr ->generic.target = (LIR *) executionCount;
	newLIR3(cUnit, kMipsLw, r_A0, 0, r_A0);
	newLIR3(cUnit, kMipsLw, r_A1, 0, r_A0);
	newLIR3(cUnit, kMipsAddiu, r_A1, r_A1, 1);
	newLIR3(cUnit, kMipsSw, r_A1, 0, r_A0);
	return 24;
	} else {
	int opcode = TEMPLATE_PERIODIC_PROFILING;
	newLIR1(cUnit, kMipsJal,
	(int) gDvmJit.codeCache + templateEntryOffsets[opcode]);
	newLIR0(cUnit, kMipsNop); /* delay slot */
	return 8;
	}
	}

	/*
	* Perform a "reg cmp imm" operation and jump to the PCR region if condition
	* satisfies.
	*/
	static void genNegFloat(CompilationUnit *cUnit, RegLocation rlDest,
	RegLocation rlSrc)
	{
	RegLocation rlResult;
	rlSrc = loadValue(cUnit, rlSrc, kCoreReg);
	rlResult = dvmCompilerEvalLoc(cUnit, rlDest, kCoreReg, true);
	opRegRegImm(cUnit, kOpAdd, rlResult.lowReg,
	rlSrc.lowReg, 0x80000000);
	storeValue(cUnit, rlDest, rlResult);
	}

	static void genNegDouble(CompilationUnit *cUnit, RegLocation rlDest,
	RegLocation rlSrc)
	{
	RegLocation rlResult;
	rlSrc = loadValueWide(cUnit, rlSrc, kCoreReg);
	rlResult = dvmCompilerEvalLoc(cUnit, rlDest, kCoreReg, true);
	opRegRegImm(cUnit, kOpAdd, rlResult.highReg, rlSrc.highReg,
	0x80000000);
	genRegCopy(cUnit, rlResult.lowReg, rlSrc.lowReg);
	storeValueWide(cUnit, rlDest, rlResult);
	}

	static void genMulLong(CompilationUnit *cUnit, RegLocation rlDest,
	RegLocation rlSrc1, RegLocation rlSrc2)
	{
	RegLocation rlResult;
	loadValueDirectWideFixed(cUnit, rlSrc1, r_ARG0, r_ARG1);
	loadValueDirectWideFixed(cUnit, rlSrc2, r_ARG2, r_ARG3);
	genDispatchToHandler(cUnit, TEMPLATE_MUL_LONG);
	rlResult = dvmCompilerGetReturnWide(cUnit);
	storeValueWide(cUnit, rlDest, rlResult);
	}

	static bool partialOverlap(int sreg1, int sreg2)
	{
	return abs(sreg1 - sreg2) == 1;
	}

	static void withCarryHelper(CompilationUnit *cUnit, MipsOpCode opc,
	RegLocation rlDest, RegLocation rlSrc1,
	RegLocation rlSrc2, int sltuSrc1, int sltuSrc2)
	{
	int tReg = dvmCompilerAllocTemp(cUnit);
	newLIR3(cUnit, opc, rlDest.lowReg, rlSrc1.lowReg, rlSrc2.lowReg);
	newLIR3(cUnit, kMipsSltu, tReg, sltuSrc1, sltuSrc2);
	newLIR3(cUnit, opc, rlDest.highReg, rlSrc1.highReg, rlSrc2.highReg);
	newLIR3(cUnit, opc, rlDest.highReg, rlDest.highReg, tReg);
	dvmCompilerFreeTemp(cUnit, tReg);
	}

	static void genLong3Addr(CompilationUnit cUnit, MIR mir, OpKind firstOp,
	OpKind secondOp, RegLocation rlDest,
	RegLocation rlSrc1, RegLocation rlSrc2)
	{
	RegLocation rlResult;
	int carryOp = (secondOp == kOpAdc \|\| secondOp == kOpSbc);

	if (partialOverlap(rlSrc1.sRegLow,rlSrc2.sRegLow) \|\|
	partialOverlap(rlSrc1.sRegLow,rlDest.sRegLow) \|\|
	partialOverlap(rlSrc2.sRegLow,rlDest.sRegLow)) {
	// Rare case - not enough registers to properly handle
	genInterpSingleStep(cUnit, mir);
	} else if (rlDest.sRegLow == rlSrc1.sRegLow) {
	rlResult = loadValueWide(cUnit, rlDest, kCoreReg);
	rlSrc2 = loadValueWide(cUnit, rlSrc2, kCoreReg);
	if (!carryOp) {
	opRegRegReg(cUnit, firstOp, rlResult.lowReg, rlResult.lowReg, rlSrc2.lowReg);
	opRegRegReg(cUnit, secondOp, rlResult.highReg, rlResult.highReg, rlSrc2.highReg);
	} else if (secondOp == kOpAdc) {
	withCarryHelper(cUnit, kMipsAddu, rlResult, rlResult, rlSrc2,
	rlResult.lowReg, rlSrc2.lowReg);
	} else {
	int tReg = dvmCompilerAllocTemp(cUnit);
	newLIR2(cUnit, kMipsMove, tReg, rlResult.lowReg);
	withCarryHelper(cUnit, kMipsSubu, rlResult, rlResult, rlSrc2,
	tReg, rlResult.lowReg);
	dvmCompilerFreeTemp(cUnit, tReg);
	}
	storeValueWide(cUnit, rlDest, rlResult);
	} else if (rlDest.sRegLow == rlSrc2.sRegLow) {
	rlResult = loadValueWide(cUnit, rlDest, kCoreReg);
	rlSrc1 = loadValueWide(cUnit, rlSrc1, kCoreReg);
	if (!carryOp) {
	opRegRegReg(cUnit, firstOp, rlResult.lowReg, rlSrc1.lowReg, rlResult.lowReg);
	opRegRegReg(cUnit, secondOp, rlResult.highReg, rlSrc1.highReg, rlResult.highReg);
	} else if (secondOp == kOpAdc) {
	withCarryHelper(cUnit, kMipsAddu, rlResult, rlSrc1, rlResult,
	rlResult.lowReg, rlSrc1.lowReg);
	} else {
	withCarryHelper(cUnit, kMipsSubu, rlResult, rlSrc1, rlResult,
	rlSrc1.lowReg, rlResult.lowReg);
	}
	storeValueWide(cUnit, rlDest, rlResult);
	} else {
	rlSrc1 = loadValueWide(cUnit, rlSrc1, kCoreReg);
	rlSrc2 = loadValueWide(cUnit, rlSrc2, kCoreReg);
	rlResult = dvmCompilerEvalLoc(cUnit, rlDest, kCoreReg, true);
	if (!carryOp) {
	opRegRegReg(cUnit, firstOp, rlResult.lowReg, rlSrc1.lowReg, rlSrc2.lowReg);
	opRegRegReg(cUnit, secondOp, rlResult.highReg, rlSrc1.highReg, rlSrc2.highReg);
	} else if (secondOp == kOpAdc) {
	withCarryHelper(cUnit, kMipsAddu, rlResult, rlSrc1, rlSrc2,
	rlResult.lowReg, rlSrc1.lowReg);
	} else {
	withCarryHelper(cUnit, kMipsSubu, rlResult, rlSrc1, rlSrc2,
	rlSrc1.lowReg, rlResult.lowReg);
	}
	storeValueWide(cUnit, rlDest, rlResult);
	}
	}

	void dvmCompilerInitializeRegAlloc(CompilationUnit *cUnit)
	{
	int numTemps = sizeof(coreTemps)/sizeof(int);
	RegisterPool pool = (RegisterPool ) dvmCompilerNew(sizeof(*pool), true);
	cUnit->regPool = pool;
	pool->numCoreTemps = numTemps;
	pool->coreTemps =
	(RegisterInfo ) dvmCompilerNew(numTemps sizeof(*pool->coreTemps), true);
	dvmCompilerInitPool(pool->coreTemps, coreTemps, pool->numCoreTemps);
	#ifdef __mips_hard_float
	int numFPTemps = sizeof(fpTemps)/sizeof(int);
	pool->numFPTemps = numFPTemps;
	pool->FPTemps =
	(RegisterInfo ) dvmCompilerNew(numFPTemps sizeof(*pool->FPTemps), true);
	dvmCompilerInitPool(pool->FPTemps, fpTemps, pool->numFPTemps);
	#else
	pool->numFPTemps = 0;
	pool->FPTemps = NULL;
	dvmCompilerInitPool(pool->FPTemps, NULL, 0);
	#endif
	pool->nullCheckedRegs =
	dvmCompilerAllocBitVector(cUnit->numSSARegs, false);
	}

	/* Export the Dalvik PC assicated with an instruction to the StackSave area */
	static MipsLIR genExportPC(CompilationUnit cUnit, MIR *mir)
	{
	MipsLIR *res;
	int rDPC = dvmCompilerAllocTemp(cUnit);
	int rAddr = dvmCompilerAllocTemp(cUnit);
	int offset = offsetof(StackSaveArea, xtra.currentPc);
	res = loadConstant(cUnit, rDPC, (int) (cUnit->method->insns + mir->offset));
	newLIR3(cUnit, kMipsAddiu, rAddr, rFP, -(sizeof(StackSaveArea) - offset));
	storeWordDisp( cUnit, rAddr, 0, rDPC);
	return res;
	}

	static void genMonitor(CompilationUnit cUnit, MIR mir)
	{
	genMonitorPortable(cUnit, mir);
	}

	static void genCmpLong(CompilationUnit cUnit, MIR mir, RegLocation rlDest,
	RegLocation rlSrc1, RegLocation rlSrc2)
	{
	RegLocation rlResult;
	loadValueDirectWideFixed(cUnit, rlSrc1, r_ARG0, r_ARG1);
	loadValueDirectWideFixed(cUnit, rlSrc2, r_ARG2, r_ARG3);
	genDispatchToHandler(cUnit, TEMPLATE_CMP_LONG);
	rlResult = dvmCompilerGetReturn(cUnit);
	storeValue(cUnit, rlDest, rlResult);
	}

	static bool genInlinedAbsFloat(CompilationUnit cUnit, MIR mir)
	{
	int offset = offsetof(Thread, interpSave.retval);
	RegLocation rlSrc = dvmCompilerGetSrc(cUnit, mir, 0);
	int reg0 = loadValue(cUnit, rlSrc, kCoreReg).lowReg;
	#if __mips_isa_rev>=2
	newLIR4(cUnit, kMipsExt, reg0, reg0, 0, 31-1 /* size-1 */);
	#else
	newLIR2(cUnit, kMipsSll, reg0, 1);
	newLIR2(cUnit, kMipsSrl, reg0, 1);
	#endif
	storeWordDisp(cUnit, rSELF, offset, reg0);
	//TUNING: rewrite this to not clobber
	dvmCompilerClobber(cUnit, reg0);
	return false;
	}

	static bool genInlinedAbsDouble(CompilationUnit cUnit, MIR mir)
	{
	int offset = offsetof(Thread, interpSave.retval);
	RegLocation rlSrc = dvmCompilerGetSrcWide(cUnit, mir, 0, 1);
	RegLocation regSrc = loadValueWide(cUnit, rlSrc, kCoreReg);
	int reglo = regSrc.lowReg;
	int reghi = regSrc.highReg;
	storeWordDisp(cUnit, rSELF, offset + LOWORD_OFFSET, reglo);
	#if __mips_isa_rev>=2
	newLIR4(cUnit, kMipsExt, reghi, reghi, 0, 31-1 /* size-1 */);
	#else
	newLIR2(cUnit, kMipsSll, reghi, 1);
	newLIR2(cUnit, kMipsSrl, reghi, 1);
	#endif
	storeWordDisp(cUnit, rSELF, offset + HIWORD_OFFSET, reghi);
	//TUNING: rewrite this to not clobber
	dvmCompilerClobber(cUnit, reghi);
	return false;
	}

	/* No select in thumb, so we need to branch. Thumb2 will do better */
	static bool genInlinedMinMaxInt(CompilationUnit cUnit, MIR mir, bool isMin)
	{
	int offset = offsetof(Thread, interpSave.retval);
	RegLocation rlSrc1 = dvmCompilerGetSrc(cUnit, mir, 0);
	RegLocation rlSrc2 = dvmCompilerGetSrc(cUnit, mir, 1);
	int reg0 = loadValue(cUnit, rlSrc1, kCoreReg).lowReg;
	int reg1 = loadValue(cUnit, rlSrc2, kCoreReg).lowReg;
	int tReg = dvmCompilerAllocTemp(cUnit);
	if (isMin) {
	newLIR3(cUnit, kMipsSlt, tReg, reg0, reg1);
	}
	else {
	newLIR3(cUnit, kMipsSlt, tReg, reg1, reg0);
	}
	newLIR3(cUnit, kMipsMovz, reg0, reg1, tReg);
	dvmCompilerFreeTemp(cUnit, tReg);
	newLIR3(cUnit, kMipsSw, reg0, offset, rSELF);
	//TUNING: rewrite this to not clobber
	dvmCompilerClobber(cUnit,reg0);
	return false;
	}

	static void genMultiplyByTwoBitMultiplier(CompilationUnit *cUnit,
	RegLocation rlSrc, RegLocation rlResult, int lit,
	int firstBit, int secondBit)
	{
	// We can't implement "add src, src, src, lsl#shift" on Thumb, so we have
	// to do a regular multiply.
	opRegRegImm(cUnit, kOpMul, rlResult.lowReg, rlSrc.lowReg, lit);
	}