buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (C) 2012 The Android Open Source Project |
| 3 | * |
| 4 | * Licensed under the Apache License, Version 2.0 (the "License"); |
| 5 | * you may not use this file except in compliance with the License. |
| 6 | * You may obtain a copy of the License at |
| 7 | * |
| 8 | * http://www.apache.org/licenses/LICENSE-2.0 |
| 9 | * |
| 10 | * Unless required by applicable law or agreed to in writing, software |
| 11 | * distributed under the License is distributed on an "AS IS" BASIS, |
| 12 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 13 | * See the License for the specific language governing permissions and |
| 14 | * limitations under the License. |
| 15 | */ |
| 16 | |
| 17 | /* |
buzbee | a7678db | 2012-03-05 15:35:46 -0800 | [diff] [blame] | 18 | * This file contains codegen for the X86 ISA and is intended to be |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 19 | * included by: |
| 20 | * |
| 21 | * Codegen-$(TARGET_ARCH_VARIANT).c |
| 22 | * |
| 23 | */ |
| 24 | |
| 25 | namespace art { |
| 26 | |
buzbee | 16da88c | 2012-03-20 10:38:17 -0700 | [diff] [blame] | 27 | void genSpecialCase(CompilationUnit* cUnit, BasicBlock* bb, MIR* mir, |
| 28 | SpecialCaseHandler specialCase) |
| 29 | { |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 30 | // TODO |
buzbee | 16da88c | 2012-03-20 10:38:17 -0700 | [diff] [blame] | 31 | } |
| 32 | |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 33 | /* |
Ian Rogers | b5d09b2 | 2012-03-06 22:14:17 -0800 | [diff] [blame] | 34 | * Perform register memory operation. |
| 35 | */ |
| 36 | LIR* genRegMemCheck(CompilationUnit* cUnit, ConditionCode cCode, |
buzbee | 408ad16 | 2012-06-06 16:45:18 -0700 | [diff] [blame] | 37 | int reg1, int base, int offset, ThrowKind kind) |
Ian Rogers | b5d09b2 | 2012-03-06 22:14:17 -0800 | [diff] [blame] | 38 | { |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 39 | LIR* tgt = rawLIR(cUnit, 0, kPseudoThrowTarget, kind, |
buzbee | 408ad16 | 2012-06-06 16:45:18 -0700 | [diff] [blame] | 40 | cUnit->currentDalvikOffset, reg1, base, offset); |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 41 | opRegMem(cUnit, kOpCmp, reg1, base, offset); |
| 42 | LIR* branch = opCondBranch(cUnit, cCode, tgt); |
| 43 | // Remember branch target - will process later |
| 44 | oatInsertGrowableList(cUnit, &cUnit->throwLaunchpads, (intptr_t)tgt); |
| 45 | return branch; |
Ian Rogers | b5d09b2 | 2012-03-06 22:14:17 -0800 | [diff] [blame] | 46 | } |
| 47 | |
| 48 | /* |
Ian Rogers | 55bd45f | 2012-04-04 17:31:20 -0700 | [diff] [blame] | 49 | * The sparse table in the literal pool is an array of <key,displacement> |
| 50 | * pairs. |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 51 | */ |
Ian Rogers | 55bd45f | 2012-04-04 17:31:20 -0700 | [diff] [blame] | 52 | BasicBlock *findBlock(CompilationUnit* cUnit, unsigned int codeOffset, |
| 53 | bool split, bool create, BasicBlock** immedPredBlockP); |
buzbee | 408ad16 | 2012-06-06 16:45:18 -0700 | [diff] [blame] | 54 | void genSparseSwitch(CompilationUnit* cUnit, uint32_t tableOffset, |
buzbee | a1da8a5 | 2012-07-09 14:00:21 -0700 | [diff] [blame] | 55 | RegLocation rlSrc) |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 56 | { |
buzbee | 408ad16 | 2012-06-06 16:45:18 -0700 | [diff] [blame] | 57 | const u2* table = cUnit->insns + cUnit->currentDalvikOffset + tableOffset; |
Ian Rogers | 55bd45f | 2012-04-04 17:31:20 -0700 | [diff] [blame] | 58 | if (cUnit->printMe) { |
| 59 | dumpSparseSwitchTable(table); |
| 60 | } |
| 61 | int entries = table[1]; |
| 62 | int* keys = (int*)&table[2]; |
| 63 | int* targets = &keys[entries]; |
| 64 | rlSrc = loadValue(cUnit, rlSrc, kCoreReg); |
| 65 | for (int i = 0; i < entries; i++) { |
| 66 | int key = keys[i]; |
buzbee | 408ad16 | 2012-06-06 16:45:18 -0700 | [diff] [blame] | 67 | BasicBlock* case_block = findBlock(cUnit, |
| 68 | cUnit->currentDalvikOffset + targets[i], |
Ian Rogers | 55bd45f | 2012-04-04 17:31:20 -0700 | [diff] [blame] | 69 | false, false, NULL); |
buzbee | a1da8a5 | 2012-07-09 14:00:21 -0700 | [diff] [blame] | 70 | LIR* labelList = cUnit->blockLabelList; |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 71 | opCmpImmBranch(cUnit, kCondEq, rlSrc.lowReg, key, |
| 72 | &labelList[case_block->id]); |
Ian Rogers | 55bd45f | 2012-04-04 17:31:20 -0700 | [diff] [blame] | 73 | } |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 74 | } |
| 75 | |
| 76 | /* |
| 77 | * Code pattern will look something like: |
| 78 | * |
Ian Rogers | 55bd45f | 2012-04-04 17:31:20 -0700 | [diff] [blame] | 79 | * mov rVal, .. |
| 80 | * call 0 |
| 81 | * pop rStartOfMethod |
| 82 | * sub rStartOfMethod, .. |
| 83 | * mov rKeyReg, rVal |
| 84 | * sub rKeyReg, lowKey |
| 85 | * cmp rKeyReg, size-1 ; bound check |
| 86 | * ja done |
| 87 | * mov rDisp, [rStartOfMethod + rKeyReg * 4 + tableOffset] |
| 88 | * add rStartOfMethod, rDisp |
| 89 | * jmp rStartOfMethod |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 90 | * done: |
| 91 | */ |
buzbee | 408ad16 | 2012-06-06 16:45:18 -0700 | [diff] [blame] | 92 | void genPackedSwitch(CompilationUnit* cUnit, uint32_t tableOffset, |
| 93 | RegLocation rlSrc) |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 94 | { |
buzbee | 408ad16 | 2012-06-06 16:45:18 -0700 | [diff] [blame] | 95 | const u2* table = cUnit->insns + cUnit->currentDalvikOffset + tableOffset; |
Ian Rogers | 7caad77 | 2012-03-30 01:07:54 -0700 | [diff] [blame] | 96 | if (cUnit->printMe) { |
| 97 | dumpPackedSwitchTable(table); |
| 98 | } |
| 99 | // Add the table to the list - we'll process it later |
| 100 | SwitchTable *tabRec = (SwitchTable *)oatNew(cUnit, sizeof(SwitchTable), |
| 101 | true, kAllocData); |
| 102 | tabRec->table = table; |
buzbee | 408ad16 | 2012-06-06 16:45:18 -0700 | [diff] [blame] | 103 | tabRec->vaddr = cUnit->currentDalvikOffset; |
Ian Rogers | 7caad77 | 2012-03-30 01:07:54 -0700 | [diff] [blame] | 104 | int size = table[1]; |
| 105 | tabRec->targets = (LIR* *)oatNew(cUnit, size * sizeof(LIR*), true, |
| 106 | kAllocLIR); |
| 107 | oatInsertGrowableList(cUnit, &cUnit->switchTables, (intptr_t)tabRec); |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 108 | |
Ian Rogers | 7caad77 | 2012-03-30 01:07:54 -0700 | [diff] [blame] | 109 | // Get the switch value |
| 110 | rlSrc = loadValue(cUnit, rlSrc, kCoreReg); |
| 111 | int startOfMethodReg = oatAllocTemp(cUnit); |
| 112 | // Materialize a pointer to the switch table |
| 113 | //newLIR0(cUnit, kX86Bkpt); |
| 114 | newLIR1(cUnit, kX86StartOfMethod, startOfMethodReg); |
| 115 | int lowKey = s4FromSwitchData(&table[2]); |
| 116 | int keyReg; |
| 117 | // Remove the bias, if necessary |
| 118 | if (lowKey == 0) { |
| 119 | keyReg = rlSrc.lowReg; |
| 120 | } else { |
| 121 | keyReg = oatAllocTemp(cUnit); |
| 122 | opRegRegImm(cUnit, kOpSub, keyReg, rlSrc.lowReg, lowKey); |
| 123 | } |
| 124 | // Bounds check - if < 0 or >= size continue following switch |
| 125 | opRegImm(cUnit, kOpCmp, keyReg, size-1); |
| 126 | LIR* branchOver = opCondBranch(cUnit, kCondHi, NULL); |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 127 | |
Ian Rogers | 7caad77 | 2012-03-30 01:07:54 -0700 | [diff] [blame] | 128 | // Load the displacement from the switch table |
| 129 | int dispReg = oatAllocTemp(cUnit); |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 130 | newLIR5(cUnit, kX86PcRelLoadRA, dispReg, startOfMethodReg, keyReg, 2, |
| 131 | (intptr_t)tabRec); |
Ian Rogers | 7caad77 | 2012-03-30 01:07:54 -0700 | [diff] [blame] | 132 | // Add displacement to start of method |
| 133 | opRegReg(cUnit, kOpAdd, startOfMethodReg, dispReg); |
| 134 | // ..and go! |
| 135 | LIR* switchBranch = newLIR1(cUnit, kX86JmpR, startOfMethodReg); |
| 136 | tabRec->anchor = switchBranch; |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 137 | |
Ian Rogers | 7caad77 | 2012-03-30 01:07:54 -0700 | [diff] [blame] | 138 | /* branchOver target here */ |
| 139 | LIR* target = newLIR0(cUnit, kPseudoTargetLabel); |
| 140 | branchOver->target = (LIR*)target; |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 141 | } |
| 142 | |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 143 | void callRuntimeHelperRegReg(CompilationUnit* cUnit, int helperOffset, |
buzbee | 8320f38 | 2012-09-11 16:29:42 -0700 | [diff] [blame] | 144 | int arg0, int arg1, bool safepointPC); |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 145 | /* |
| 146 | * Array data table format: |
| 147 | * ushort ident = 0x0300 magic value |
| 148 | * ushort width width of each element in the table |
| 149 | * uint size number of elements in the table |
| 150 | * ubyte data[size*width] table of data values (may contain a single-byte |
| 151 | * padding at the end) |
| 152 | * |
| 153 | * Total size is 4+(width * size + 1)/2 16-bit code units. |
| 154 | */ |
buzbee | 408ad16 | 2012-06-06 16:45:18 -0700 | [diff] [blame] | 155 | void genFillArrayData(CompilationUnit* cUnit, uint32_t tableOffset, |
| 156 | RegLocation rlSrc) |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 157 | { |
buzbee | 408ad16 | 2012-06-06 16:45:18 -0700 | [diff] [blame] | 158 | const u2* table = cUnit->insns + cUnit->currentDalvikOffset + tableOffset; |
Ian Rogers | 7caad77 | 2012-03-30 01:07:54 -0700 | [diff] [blame] | 159 | // Add the table to the list - we'll process it later |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 160 | FillArrayData *tabRec = (FillArrayData *)oatNew(cUnit, sizeof(FillArrayData), |
| 161 | true, kAllocData); |
Ian Rogers | 7caad77 | 2012-03-30 01:07:54 -0700 | [diff] [blame] | 162 | tabRec->table = table; |
buzbee | 408ad16 | 2012-06-06 16:45:18 -0700 | [diff] [blame] | 163 | tabRec->vaddr = cUnit->currentDalvikOffset; |
Ian Rogers | 7caad77 | 2012-03-30 01:07:54 -0700 | [diff] [blame] | 164 | u2 width = tabRec->table[1]; |
| 165 | u4 size = tabRec->table[2] | (((u4)tabRec->table[3]) << 16); |
| 166 | tabRec->size = (size * width) + 8; |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 167 | |
Ian Rogers | 7caad77 | 2012-03-30 01:07:54 -0700 | [diff] [blame] | 168 | oatInsertGrowableList(cUnit, &cUnit->fillArrayData, (intptr_t)tabRec); |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 169 | |
Ian Rogers | 7caad77 | 2012-03-30 01:07:54 -0700 | [diff] [blame] | 170 | // Making a call - use explicit registers |
| 171 | oatFlushAllRegs(cUnit); /* Everything to home location */ |
| 172 | loadValueDirectFixed(cUnit, rlSrc, rARG0); |
| 173 | // Materialize a pointer to the fill data image |
| 174 | newLIR1(cUnit, kX86StartOfMethod, rARG2); |
| 175 | newLIR2(cUnit, kX86PcRelAdr, rARG1, (intptr_t)tabRec); |
| 176 | newLIR2(cUnit, kX86Add32RR, rARG1, rARG2); |
buzbee | 8320f38 | 2012-09-11 16:29:42 -0700 | [diff] [blame] | 177 | callRuntimeHelperRegReg(cUnit, ENTRYPOINT_OFFSET(pHandleFillArrayDataFromCode), rARG0, rARG1, |
| 178 | true); |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 179 | } |
| 180 | |
| 181 | void genNegFloat(CompilationUnit *cUnit, RegLocation rlDest, RegLocation rlSrc) |
| 182 | { |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 183 | RegLocation rlResult; |
| 184 | rlSrc = loadValue(cUnit, rlSrc, kCoreReg); |
| 185 | rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true); |
| 186 | opRegRegImm(cUnit, kOpAdd, rlResult.lowReg, rlSrc.lowReg, 0x80000000); |
| 187 | storeValue(cUnit, rlDest, rlResult); |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 188 | } |
| 189 | |
| 190 | void genNegDouble(CompilationUnit *cUnit, RegLocation rlDest, RegLocation rlSrc) |
| 191 | { |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 192 | RegLocation rlResult; |
| 193 | rlSrc = loadValueWide(cUnit, rlSrc, kCoreReg); |
| 194 | rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true); |
| 195 | opRegRegImm(cUnit, kOpAdd, rlResult.highReg, rlSrc.highReg, 0x80000000); |
| 196 | opRegCopy(cUnit, rlResult.lowReg, rlSrc.lowReg); |
| 197 | storeValueWide(cUnit, rlDest, rlResult); |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 198 | } |
| 199 | |
buzbee | 408ad16 | 2012-06-06 16:45:18 -0700 | [diff] [blame] | 200 | LIR* genNullCheck(CompilationUnit* cUnit, int sReg, int mReg, int optFlags); |
buzbee | 8320f38 | 2012-09-11 16:29:42 -0700 | [diff] [blame] | 201 | void callRuntimeHelperReg(CompilationUnit* cUnit, int helperOffset, int arg0, bool safepointPC); |
Ian Rogers | 7caad77 | 2012-03-30 01:07:54 -0700 | [diff] [blame] | 202 | |
buzbee | 408ad16 | 2012-06-06 16:45:18 -0700 | [diff] [blame] | 203 | void genMonitorEnter(CompilationUnit* cUnit, int optFlags, RegLocation rlSrc) |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 204 | { |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 205 | oatFlushAllRegs(cUnit); |
jeffhao | 8302576 | 2012-08-02 11:08:56 -0700 | [diff] [blame] | 206 | loadValueDirectFixed(cUnit, rlSrc, rCX); // Get obj |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 207 | oatLockCallTemps(cUnit); // Prepare for explicit register usage |
jeffhao | 8302576 | 2012-08-02 11:08:56 -0700 | [diff] [blame] | 208 | genNullCheck(cUnit, rlSrc.sRegLow, rCX, optFlags); |
| 209 | // If lock is unheld, try to grab it quickly with compare and exchange |
| 210 | // TODO: copy and clear hash state? |
| 211 | newLIR2(cUnit, kX86Mov32RT, rDX, Thread::ThinLockIdOffset().Int32Value()); |
| 212 | newLIR2(cUnit, kX86Sal32RI, rDX, LW_LOCK_OWNER_SHIFT); |
| 213 | newLIR2(cUnit, kX86Xor32RR, rAX, rAX); |
| 214 | newLIR3(cUnit, kX86LockCmpxchgMR, rCX, Object::MonitorOffset().Int32Value(), rDX); |
| 215 | LIR* branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondEq); |
| 216 | // If lock is held, go the expensive route - artLockObjectFromCode(self, obj); |
buzbee | 8320f38 | 2012-09-11 16:29:42 -0700 | [diff] [blame] | 217 | callRuntimeHelperReg(cUnit, ENTRYPOINT_OFFSET(pLockObjectFromCode), rCX, true); |
jeffhao | 8302576 | 2012-08-02 11:08:56 -0700 | [diff] [blame] | 218 | branch->target = newLIR0(cUnit, kPseudoTargetLabel); |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 219 | } |
| 220 | |
buzbee | 408ad16 | 2012-06-06 16:45:18 -0700 | [diff] [blame] | 221 | void genMonitorExit(CompilationUnit* cUnit, int optFlags, RegLocation rlSrc) |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 222 | { |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 223 | oatFlushAllRegs(cUnit); |
jeffhao | 8302576 | 2012-08-02 11:08:56 -0700 | [diff] [blame] | 224 | loadValueDirectFixed(cUnit, rlSrc, rAX); // Get obj |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 225 | oatLockCallTemps(cUnit); // Prepare for explicit register usage |
jeffhao | 8302576 | 2012-08-02 11:08:56 -0700 | [diff] [blame] | 226 | genNullCheck(cUnit, rlSrc.sRegLow, rAX, optFlags); |
| 227 | // If lock is held by the current thread, clear it to quickly release it |
| 228 | // TODO: clear hash state? |
| 229 | newLIR2(cUnit, kX86Mov32RT, rDX, Thread::ThinLockIdOffset().Int32Value()); |
| 230 | newLIR2(cUnit, kX86Sal32RI, rDX, LW_LOCK_OWNER_SHIFT); |
| 231 | newLIR3(cUnit, kX86Mov32RM, rCX, rAX, Object::MonitorOffset().Int32Value()); |
| 232 | opRegReg(cUnit, kOpSub, rCX, rDX); |
| 233 | LIR* branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondNe); |
| 234 | newLIR3(cUnit, kX86Mov32MR, rAX, Object::MonitorOffset().Int32Value(), rCX); |
| 235 | LIR* branch2 = newLIR1(cUnit, kX86Jmp8, 0); |
| 236 | branch->target = newLIR0(cUnit, kPseudoTargetLabel); |
| 237 | // Otherwise, go the expensive route - UnlockObjectFromCode(obj); |
buzbee | 8320f38 | 2012-09-11 16:29:42 -0700 | [diff] [blame] | 238 | callRuntimeHelperReg(cUnit, ENTRYPOINT_OFFSET(pUnlockObjectFromCode), rAX, true); |
jeffhao | 8302576 | 2012-08-02 11:08:56 -0700 | [diff] [blame] | 239 | branch2->target = newLIR0(cUnit, kPseudoTargetLabel); |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 240 | } |
| 241 | |
| 242 | /* |
| 243 | * Compare two 64-bit values |
| 244 | * x = y return 0 |
| 245 | * x < y return -1 |
| 246 | * x > y return 1 |
| 247 | * |
| 248 | * slt t0, x.hi, y.hi; # (x.hi < y.hi) ? 1:0 |
| 249 | * sgt t1, x.hi, y.hi; # (y.hi > x.hi) ? 1:0 |
| 250 | * subu res, t0, t1 # res = -1:1:0 for [ < > = ] |
| 251 | * bnez res, finish |
| 252 | * sltu t0, x.lo, y.lo |
| 253 | * sgtu r1, x.lo, y.lo |
| 254 | * subu res, t0, t1 |
| 255 | * finish: |
| 256 | * |
| 257 | */ |
buzbee | 408ad16 | 2012-06-06 16:45:18 -0700 | [diff] [blame] | 258 | void genCmpLong(CompilationUnit* cUnit, RegLocation rlDest, |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 259 | RegLocation rlSrc1, RegLocation rlSrc2) |
| 260 | { |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 261 | oatFlushAllRegs(cUnit); |
| 262 | oatLockCallTemps(cUnit); // Prepare for explicit register usage |
| 263 | loadValueDirectWideFixed(cUnit, rlSrc1, r0, r1); |
jeffhao | 644d531 | 2012-05-03 19:04:49 -0700 | [diff] [blame] | 264 | loadValueDirectWideFixed(cUnit, rlSrc2, r2, r3); |
| 265 | // Compute (r1:r0) = (r1:r0) - (r3:r2) |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 266 | opRegReg(cUnit, kOpSub, r0, r2); // r0 = r0 - r2 |
| 267 | opRegReg(cUnit, kOpSbc, r1, r3); // r1 = r1 - r3 - CF |
jeffhao | 1395b1e | 2012-06-13 18:05:13 -0700 | [diff] [blame] | 268 | newLIR2(cUnit, kX86Set8R, r2, kX86CondL); // r2 = (r1:r0) < (r3:r2) ? 1 : 0 |
| 269 | newLIR2(cUnit, kX86Movzx8RR, r2, r2); |
| 270 | opReg(cUnit, kOpNeg, r2); // r2 = -r2 |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 271 | opRegReg(cUnit, kOpOr, r0, r1); // r0 = high | low - sets ZF |
jeffhao | 644d531 | 2012-05-03 19:04:49 -0700 | [diff] [blame] | 272 | newLIR2(cUnit, kX86Set8R, r0, kX86CondNz); // r0 = (r1:r0) != (r3:r2) ? 1 : 0 |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 273 | newLIR2(cUnit, kX86Movzx8RR, r0, r0); |
jeffhao | 1395b1e | 2012-06-13 18:05:13 -0700 | [diff] [blame] | 274 | opRegReg(cUnit, kOpOr, r0, r2); // r0 = r0 | r2 |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 275 | RegLocation rlResult = LOC_C_RETURN; |
| 276 | storeValue(cUnit, rlDest, rlResult); |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 277 | } |
| 278 | |
Ian Rogers | b5d09b2 | 2012-03-06 22:14:17 -0800 | [diff] [blame] | 279 | X86ConditionCode oatX86ConditionEncoding(ConditionCode cond) { |
Elliott Hughes | b25c3f6 | 2012-03-26 16:35:06 -0700 | [diff] [blame] | 280 | switch (cond) { |
Ian Rogers | b5d09b2 | 2012-03-06 22:14:17 -0800 | [diff] [blame] | 281 | case kCondEq: return kX86CondEq; |
| 282 | case kCondNe: return kX86CondNe; |
| 283 | case kCondCs: return kX86CondC; |
| 284 | case kCondCc: return kX86CondNc; |
| 285 | case kCondMi: return kX86CondS; |
| 286 | case kCondPl: return kX86CondNs; |
| 287 | case kCondVs: return kX86CondO; |
| 288 | case kCondVc: return kX86CondNo; |
| 289 | case kCondHi: return kX86CondA; |
| 290 | case kCondLs: return kX86CondBe; |
| 291 | case kCondGe: return kX86CondGe; |
| 292 | case kCondLt: return kX86CondL; |
| 293 | case kCondGt: return kX86CondG; |
| 294 | case kCondLe: return kX86CondLe; |
| 295 | case kCondAl: |
| 296 | case kCondNv: LOG(FATAL) << "Should not reach here"; |
| 297 | } |
| 298 | return kX86CondO; |
| 299 | } |
| 300 | |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 301 | LIR* opCmpBranch(CompilationUnit* cUnit, ConditionCode cond, int src1, |
| 302 | int src2, LIR* target) |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 303 | { |
Ian Rogers | b5d09b2 | 2012-03-06 22:14:17 -0800 | [diff] [blame] | 304 | newLIR2(cUnit, kX86Cmp32RR, src1, src2); |
| 305 | X86ConditionCode cc = oatX86ConditionEncoding(cond); |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 306 | LIR* branch = newLIR2(cUnit, kX86Jcc8, 0 /* lir operand for Jcc offset */ , |
| 307 | cc); |
Ian Rogers | b5d09b2 | 2012-03-06 22:14:17 -0800 | [diff] [blame] | 308 | branch->target = target; |
| 309 | return branch; |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 310 | } |
| 311 | |
| 312 | LIR* opCmpImmBranch(CompilationUnit* cUnit, ConditionCode cond, int reg, |
| 313 | int checkValue, LIR* target) |
| 314 | { |
Ian Rogers | 2e9f7ed | 2012-09-26 11:30:43 -0700 | [diff] [blame] | 315 | if ((checkValue == 0) && (cond == kCondEq || cond == kCondNe)) { |
Ian Rogers | 7caad77 | 2012-03-30 01:07:54 -0700 | [diff] [blame] | 316 | // TODO: when checkValue == 0 and reg is rCX, use the jcxz/nz opcode |
Ian Rogers | 2e9f7ed | 2012-09-26 11:30:43 -0700 | [diff] [blame] | 317 | newLIR2(cUnit, kX86Test32RR, reg, reg); |
Ian Rogers | 7caad77 | 2012-03-30 01:07:54 -0700 | [diff] [blame] | 318 | } else { |
Ian Rogers | 2e9f7ed | 2012-09-26 11:30:43 -0700 | [diff] [blame] | 319 | newLIR2(cUnit, IS_SIMM8(checkValue) ? kX86Cmp32RI8 : kX86Cmp32RI, reg, checkValue); |
Ian Rogers | 7caad77 | 2012-03-30 01:07:54 -0700 | [diff] [blame] | 320 | } |
Ian Rogers | b5d09b2 | 2012-03-06 22:14:17 -0800 | [diff] [blame] | 321 | X86ConditionCode cc = oatX86ConditionEncoding(cond); |
Ian Rogers | b41b33b | 2012-03-20 14:22:54 -0700 | [diff] [blame] | 322 | LIR* branch = newLIR2(cUnit, kX86Jcc8, 0 /* lir operand for Jcc offset */ , cc); |
Ian Rogers | b5d09b2 | 2012-03-06 22:14:17 -0800 | [diff] [blame] | 323 | branch->target = target; |
| 324 | return branch; |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 325 | } |
| 326 | |
| 327 | LIR* opRegCopyNoInsert(CompilationUnit *cUnit, int rDest, int rSrc) |
| 328 | { |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 329 | if (FPREG(rDest) || FPREG(rSrc)) |
| 330 | return fpRegCopy(cUnit, rDest, rSrc); |
| 331 | LIR* res = rawLIR(cUnit, cUnit->currentDalvikOffset, kX86Mov32RR, |
| 332 | rDest, rSrc); |
| 333 | if (rDest == rSrc) { |
| 334 | res->flags.isNop = true; |
| 335 | } |
| 336 | return res; |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 337 | } |
| 338 | |
| 339 | LIR* opRegCopy(CompilationUnit *cUnit, int rDest, int rSrc) |
| 340 | { |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 341 | LIR *res = opRegCopyNoInsert(cUnit, rDest, rSrc); |
| 342 | oatAppendLIR(cUnit, res); |
| 343 | return res; |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 344 | } |
| 345 | |
| 346 | void opRegCopyWide(CompilationUnit *cUnit, int destLo, int destHi, |
Bill Buzbee | a114add | 2012-05-03 15:00:40 -0700 | [diff] [blame] | 347 | int srcLo, int srcHi) |
| 348 | { |
Ian Rogers | f7d9ad3 | 2012-03-13 18:45:39 -0700 | [diff] [blame] | 349 | bool destFP = FPREG(destLo) && FPREG(destHi); |
| 350 | bool srcFP = FPREG(srcLo) && FPREG(srcHi); |
| 351 | assert(FPREG(srcLo) == FPREG(srcHi)); |
| 352 | assert(FPREG(destLo) == FPREG(destHi)); |
Ian Rogers | f7d9ad3 | 2012-03-13 18:45:39 -0700 | [diff] [blame] | 353 | if (destFP) { |
| 354 | if (srcFP) { |
| 355 | opRegCopy(cUnit, S2D(destLo, destHi), S2D(srcLo, srcHi)); |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 356 | } else { |
jeffhao | fdffdf8 | 2012-07-11 16:08:43 -0700 | [diff] [blame] | 357 | // TODO: Prevent this from happening in the code. The result is often |
| 358 | // unused or could have been loaded more easily from memory. |
| 359 | newLIR2(cUnit, kX86MovdxrRR, destLo, srcLo); |
| 360 | newLIR2(cUnit, kX86MovdxrRR, destHi, srcHi); |
| 361 | newLIR2(cUnit, kX86PsllqRI, destHi, 32); |
| 362 | newLIR2(cUnit, kX86OrpsRR, destLo, destHi); |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 363 | } |
Ian Rogers | f7d9ad3 | 2012-03-13 18:45:39 -0700 | [diff] [blame] | 364 | } else { |
| 365 | if (srcFP) { |
jeffhao | fdffdf8 | 2012-07-11 16:08:43 -0700 | [diff] [blame] | 366 | newLIR2(cUnit, kX86MovdrxRR, destLo, srcLo); |
| 367 | newLIR2(cUnit, kX86PsrlqRI, srcLo, 32); |
| 368 | newLIR2(cUnit, kX86MovdrxRR, destHi, srcLo); |
Ian Rogers | f7d9ad3 | 2012-03-13 18:45:39 -0700 | [diff] [blame] | 369 | } else { |
| 370 | // Handle overlap |
| 371 | if (srcHi == destLo) { |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 372 | opRegCopy(cUnit, destHi, srcHi); |
| 373 | opRegCopy(cUnit, destLo, srcLo); |
Ian Rogers | f7d9ad3 | 2012-03-13 18:45:39 -0700 | [diff] [blame] | 374 | } else { |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 375 | opRegCopy(cUnit, destLo, srcLo); |
| 376 | opRegCopy(cUnit, destHi, srcHi); |
Ian Rogers | f7d9ad3 | 2012-03-13 18:45:39 -0700 | [diff] [blame] | 377 | } |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 378 | } |
Ian Rogers | f7d9ad3 | 2012-03-13 18:45:39 -0700 | [diff] [blame] | 379 | } |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 380 | } |
| 381 | |
jeffhao | 4b771a0 | 2012-07-25 15:07:21 -0700 | [diff] [blame] | 382 | void genFusedLongCmpBranch(CompilationUnit* cUnit, BasicBlock* bb, MIR* mir) { |
| 383 | LIR* labelList = cUnit->blockLabelList; |
| 384 | LIR* taken = &labelList[bb->taken->id]; |
| 385 | RegLocation rlSrc1 = oatGetSrcWide(cUnit, mir, 0); |
| 386 | RegLocation rlSrc2 = oatGetSrcWide(cUnit, mir, 2); |
| 387 | oatFlushAllRegs(cUnit); |
| 388 | oatLockCallTemps(cUnit); // Prepare for explicit register usage |
| 389 | loadValueDirectWideFixed(cUnit, rlSrc1, r0, r1); |
| 390 | loadValueDirectWideFixed(cUnit, rlSrc2, r2, r3); |
| 391 | ConditionCode ccode = static_cast<ConditionCode>(mir->dalvikInsn.arg[0]); |
| 392 | // Swap operands and condition code to prevent use of zero flag. |
| 393 | if (ccode == kCondLe || ccode == kCondGt) { |
| 394 | // Compute (r3:r2) = (r3:r2) - (r1:r0) |
| 395 | opRegReg(cUnit, kOpSub, r2, r0); // r2 = r2 - r0 |
| 396 | opRegReg(cUnit, kOpSbc, r3, r1); // r3 = r3 - r1 - CF |
| 397 | } else { |
| 398 | // Compute (r1:r0) = (r1:r0) - (r3:r2) |
| 399 | opRegReg(cUnit, kOpSub, r0, r2); // r0 = r0 - r2 |
| 400 | opRegReg(cUnit, kOpSbc, r1, r3); // r1 = r1 - r3 - CF |
| 401 | } |
| 402 | switch (ccode) { |
| 403 | case kCondEq: |
| 404 | case kCondNe: |
| 405 | opRegReg(cUnit, kOpOr, r0, r1); // r0 = r0 | r1 |
| 406 | break; |
| 407 | case kCondLe: |
| 408 | ccode = kCondGe; |
| 409 | break; |
| 410 | case kCondGt: |
| 411 | ccode = kCondLt; |
| 412 | break; |
| 413 | case kCondLt: |
| 414 | case kCondGe: |
| 415 | break; |
| 416 | default: |
| 417 | LOG(FATAL) << "Unexpected ccode: " << (int)ccode; |
| 418 | } |
| 419 | opCondBranch(cUnit, ccode, taken); |
| 420 | } |
| 421 | |
buzbee | e88dfbf | 2012-03-05 11:19:57 -0800 | [diff] [blame] | 422 | } // namespace art |