blob: 5e97a50d509913b12c926662341abcc51e9c4cb0 [file] [log] [blame]
buzbeee88dfbf2012-03-05 11:19:57 -08001/*
2 * Copyright (C) 2012 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17namespace art {
18
buzbee408ad162012-06-06 16:45:18 -070019static bool genArithOpFloat(CompilationUnit *cUnit, Instruction::Code opcode,
Bill Buzbeea114add2012-05-03 15:00:40 -070020 RegLocation rlDest, RegLocation rlSrc1,
21 RegLocation rlSrc2) {
Ian Rogersb5d09b22012-03-06 22:14:17 -080022 X86OpCode op = kX86Nop;
23 RegLocation rlResult;
buzbeee88dfbf2012-03-05 11:19:57 -080024
Ian Rogersb5d09b22012-03-06 22:14:17 -080025 /*
26 * Don't attempt to optimize register usage since these opcodes call out to
27 * the handlers.
28 */
buzbee408ad162012-06-06 16:45:18 -070029 switch (opcode) {
Ian Rogersb5d09b22012-03-06 22:14:17 -080030 case Instruction::ADD_FLOAT_2ADDR:
31 case Instruction::ADD_FLOAT:
32 op = kX86AddssRR;
33 break;
34 case Instruction::SUB_FLOAT_2ADDR:
35 case Instruction::SUB_FLOAT:
36 op = kX86SubssRR;
37 break;
38 case Instruction::DIV_FLOAT_2ADDR:
39 case Instruction::DIV_FLOAT:
40 op = kX86DivssRR;
41 break;
42 case Instruction::MUL_FLOAT_2ADDR:
43 case Instruction::MUL_FLOAT:
44 op = kX86MulssRR;
45 break;
jeffhaobabda952012-08-02 15:55:30 -070046 case Instruction::NEG_FLOAT:
Ian Rogersb5d09b22012-03-06 22:14:17 -080047 case Instruction::REM_FLOAT_2ADDR:
jeffhaobabda952012-08-02 15:55:30 -070048 case Instruction::REM_FLOAT:
buzbee408ad162012-06-06 16:45:18 -070049 return genArithOpFloatPortable(cUnit, opcode, rlDest, rlSrc1, rlSrc2);
Ian Rogersb5d09b22012-03-06 22:14:17 -080050 default:
51 return true;
52 }
53 rlSrc1 = loadValue(cUnit, rlSrc1, kFPReg);
54 rlSrc2 = loadValue(cUnit, rlSrc2, kFPReg);
55 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
56 int rDest = rlResult.lowReg;
57 int rSrc1 = rlSrc1.lowReg;
58 int rSrc2 = rlSrc2.lowReg;
jeffhao573b4292012-07-30 16:37:41 -070059 if (rDest == rSrc2) {
jeffhao4abb1a92012-06-08 17:02:08 -070060 rSrc2 = oatAllocTempFloat(cUnit);
61 opRegCopy(cUnit, rSrc2, rDest);
62 }
Ian Rogersb5d09b22012-03-06 22:14:17 -080063 opRegCopy(cUnit, rDest, rSrc1);
64 newLIR2(cUnit, op, rDest, rSrc2);
65 storeValue(cUnit, rlDest, rlResult);
buzbeee88dfbf2012-03-05 11:19:57 -080066
Ian Rogersb5d09b22012-03-06 22:14:17 -080067 return false;
buzbeee88dfbf2012-03-05 11:19:57 -080068}
69
buzbee408ad162012-06-06 16:45:18 -070070static bool genArithOpDouble(CompilationUnit *cUnit, Instruction::Code opcode,
buzbeee88dfbf2012-03-05 11:19:57 -080071 RegLocation rlDest, RegLocation rlSrc1,
Ian Rogersb5d09b22012-03-06 22:14:17 -080072 RegLocation rlSrc2) {
73 X86OpCode op = kX86Nop;
74 RegLocation rlResult;
buzbeee88dfbf2012-03-05 11:19:57 -080075
buzbee408ad162012-06-06 16:45:18 -070076 switch (opcode) {
Ian Rogersb5d09b22012-03-06 22:14:17 -080077 case Instruction::ADD_DOUBLE_2ADDR:
78 case Instruction::ADD_DOUBLE:
79 op = kX86AddsdRR;
80 break;
81 case Instruction::SUB_DOUBLE_2ADDR:
82 case Instruction::SUB_DOUBLE:
83 op = kX86SubsdRR;
84 break;
85 case Instruction::DIV_DOUBLE_2ADDR:
86 case Instruction::DIV_DOUBLE:
87 op = kX86DivsdRR;
88 break;
89 case Instruction::MUL_DOUBLE_2ADDR:
90 case Instruction::MUL_DOUBLE:
91 op = kX86MulsdRR;
92 break;
jeffhaobabda952012-08-02 15:55:30 -070093 case Instruction::NEG_DOUBLE:
Ian Rogersb5d09b22012-03-06 22:14:17 -080094 case Instruction::REM_DOUBLE_2ADDR:
jeffhaobabda952012-08-02 15:55:30 -070095 case Instruction::REM_DOUBLE:
buzbee408ad162012-06-06 16:45:18 -070096 return genArithOpDoublePortable(cUnit, opcode, rlDest, rlSrc1, rlSrc2);
Ian Rogersb5d09b22012-03-06 22:14:17 -080097 default:
98 return true;
99 }
100 rlSrc1 = loadValueWide(cUnit, rlSrc1, kFPReg);
101 DCHECK(rlSrc1.wide);
102 rlSrc2 = loadValueWide(cUnit, rlSrc2, kFPReg);
103 DCHECK(rlSrc2.wide);
104 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
105 DCHECK(rlDest.wide);
106 DCHECK(rlResult.wide);
buzbeef0504cd2012-11-13 16:31:10 -0800107 int rDest = s2d(rlResult.lowReg, rlResult.highReg);
108 int rSrc1 = s2d(rlSrc1.lowReg, rlSrc1.highReg);
109 int rSrc2 = s2d(rlSrc2.lowReg, rlSrc2.highReg);
jeffhao4abb1a92012-06-08 17:02:08 -0700110 if (rDest == rSrc2) {
buzbeef0504cd2012-11-13 16:31:10 -0800111 rSrc2 = oatAllocTempDouble(cUnit) | X86_FP_DOUBLE;
jeffhao4abb1a92012-06-08 17:02:08 -0700112 opRegCopy(cUnit, rSrc2, rDest);
113 }
Ian Rogersb5d09b22012-03-06 22:14:17 -0800114 opRegCopy(cUnit, rDest, rSrc1);
115 newLIR2(cUnit, op, rDest, rSrc2);
116 storeValueWide(cUnit, rlDest, rlResult);
117 return false;
buzbeee88dfbf2012-03-05 11:19:57 -0800118}
119
buzbee408ad162012-06-06 16:45:18 -0700120static bool genConversion(CompilationUnit *cUnit, Instruction::Code opcode,
121 RegLocation rlDest, RegLocation rlSrc) {
jeffhao5121e0b2012-05-08 18:23:38 -0700122 RegisterClass rcSrc = kFPReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800123 X86OpCode op = kX86Nop;
124 int srcReg;
125 RegLocation rlResult;
126 switch (opcode) {
127 case Instruction::INT_TO_FLOAT:
jeffhao5121e0b2012-05-08 18:23:38 -0700128 rcSrc = kCoreReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800129 op = kX86Cvtsi2ssRR;
130 break;
131 case Instruction::DOUBLE_TO_FLOAT:
jeffhao5121e0b2012-05-08 18:23:38 -0700132 rcSrc = kFPReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800133 op = kX86Cvtsd2ssRR;
134 break;
135 case Instruction::FLOAT_TO_DOUBLE:
jeffhao5121e0b2012-05-08 18:23:38 -0700136 rcSrc = kFPReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800137 op = kX86Cvtss2sdRR;
138 break;
139 case Instruction::INT_TO_DOUBLE:
jeffhao5121e0b2012-05-08 18:23:38 -0700140 rcSrc = kCoreReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800141 op = kX86Cvtsi2sdRR;
142 break;
jeffhao292188d2012-05-17 15:45:04 -0700143 case Instruction::FLOAT_TO_INT: {
jeffhao41005dd2012-05-09 17:58:52 -0700144 rlSrc = loadValue(cUnit, rlSrc, kFPReg);
145 srcReg = rlSrc.lowReg;
jeffhao41005dd2012-05-09 17:58:52 -0700146 oatClobberSReg(cUnit, rlDest.sRegLow);
147 rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
jeffhao292188d2012-05-17 15:45:04 -0700148 int tempReg = oatAllocTempFloat(cUnit);
jeffhao41005dd2012-05-09 17:58:52 -0700149
150 loadConstant(cUnit, rlResult.lowReg, 0x7fffffff);
151 newLIR2(cUnit, kX86Cvtsi2ssRR, tempReg, rlResult.lowReg);
152 newLIR2(cUnit, kX86ComissRR, srcReg, tempReg);
jeffhao292188d2012-05-17 15:45:04 -0700153 LIR* branchPosOverflow = newLIR2(cUnit, kX86Jcc8, 0, kX86CondA);
154 LIR* branchNaN = newLIR2(cUnit, kX86Jcc8, 0, kX86CondP);
155 newLIR2(cUnit, kX86Cvttss2siRR, rlResult.lowReg, srcReg);
156 LIR* branchNormal = newLIR1(cUnit, kX86Jmp8, 0);
157 branchNaN->target = newLIR0(cUnit, kPseudoTargetLabel);
158 newLIR2(cUnit, kX86Xor32RR, rlResult.lowReg, rlResult.lowReg);
159 branchPosOverflow->target = newLIR0(cUnit, kPseudoTargetLabel);
160 branchNormal->target = newLIR0(cUnit, kPseudoTargetLabel);
jeffhao41005dd2012-05-09 17:58:52 -0700161 storeValue(cUnit, rlDest, rlResult);
162 return false;
jeffhao292188d2012-05-17 15:45:04 -0700163 }
164 case Instruction::DOUBLE_TO_INT: {
jeffhao41005dd2012-05-09 17:58:52 -0700165 rlSrc = loadValueWide(cUnit, rlSrc, kFPReg);
166 srcReg = rlSrc.lowReg;
jeffhao41005dd2012-05-09 17:58:52 -0700167 oatClobberSReg(cUnit, rlDest.sRegLow);
168 rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
buzbeef0504cd2012-11-13 16:31:10 -0800169 int tempReg = oatAllocTempDouble(cUnit) | X86_FP_DOUBLE;
jeffhao41005dd2012-05-09 17:58:52 -0700170
171 loadConstant(cUnit, rlResult.lowReg, 0x7fffffff);
172 newLIR2(cUnit, kX86Cvtsi2sdRR, tempReg, rlResult.lowReg);
173 newLIR2(cUnit, kX86ComisdRR, srcReg, tempReg);
jeffhao292188d2012-05-17 15:45:04 -0700174 LIR* branchPosOverflow = newLIR2(cUnit, kX86Jcc8, 0, kX86CondA);
175 LIR* branchNaN = newLIR2(cUnit, kX86Jcc8, 0, kX86CondP);
176 newLIR2(cUnit, kX86Cvttsd2siRR, rlResult.lowReg, srcReg);
177 LIR* branchNormal = newLIR1(cUnit, kX86Jmp8, 0);
178 branchNaN->target = newLIR0(cUnit, kPseudoTargetLabel);
179 newLIR2(cUnit, kX86Xor32RR, rlResult.lowReg, rlResult.lowReg);
180 branchPosOverflow->target = newLIR0(cUnit, kPseudoTargetLabel);
181 branchNormal->target = newLIR0(cUnit, kPseudoTargetLabel);
jeffhao41005dd2012-05-09 17:58:52 -0700182 storeValue(cUnit, rlDest, rlResult);
183 return false;
jeffhao292188d2012-05-17 15:45:04 -0700184 }
Ian Rogersb5d09b22012-03-06 22:14:17 -0800185 case Instruction::LONG_TO_DOUBLE:
Ian Rogersb5d09b22012-03-06 22:14:17 -0800186 case Instruction::LONG_TO_FLOAT:
jeffhaobabda952012-08-02 15:55:30 -0700187 // TODO: inline by using memory as a 64-bit source. Be careful about promoted registers.
jeffhao41005dd2012-05-09 17:58:52 -0700188 case Instruction::FLOAT_TO_LONG:
Ian Rogersb5d09b22012-03-06 22:14:17 -0800189 case Instruction::DOUBLE_TO_LONG:
buzbee408ad162012-06-06 16:45:18 -0700190 return genConversionPortable(cUnit, opcode, rlDest, rlSrc);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800191 default:
192 return true;
193 }
buzbee408ad162012-06-06 16:45:18 -0700194 if (rlSrc.wide) {
jeffhao5121e0b2012-05-08 18:23:38 -0700195 rlSrc = loadValueWide(cUnit, rlSrc, rcSrc);
buzbeef0504cd2012-11-13 16:31:10 -0800196 srcReg = s2d(rlSrc.lowReg, rlSrc.highReg);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800197 } else {
jeffhao5121e0b2012-05-08 18:23:38 -0700198 rlSrc = loadValue(cUnit, rlSrc, rcSrc);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800199 srcReg = rlSrc.lowReg;
200 }
buzbee408ad162012-06-06 16:45:18 -0700201 if (rlDest.wide) {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800202 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
buzbeef0504cd2012-11-13 16:31:10 -0800203 newLIR2(cUnit, op, s2d(rlResult.lowReg, rlResult.highReg), srcReg);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800204 storeValueWide(cUnit, rlDest, rlResult);
205 } else {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800206 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
207 newLIR2(cUnit, op, rlResult.lowReg, srcReg);
208 storeValue(cUnit, rlDest, rlResult);
209 }
210 return false;
buzbeee88dfbf2012-03-05 11:19:57 -0800211}
212
buzbee408ad162012-06-06 16:45:18 -0700213static bool genCmpFP(CompilationUnit *cUnit, Instruction::Code code, RegLocation rlDest,
Ian Rogersb5d09b22012-03-06 22:14:17 -0800214 RegLocation rlSrc1, RegLocation rlSrc2) {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800215 bool single = (code == Instruction::CMPL_FLOAT) || (code == Instruction::CMPG_FLOAT);
216 bool unorderedGt = (code == Instruction::CMPG_DOUBLE) || (code == Instruction::CMPG_FLOAT);
217 int srcReg1;
218 int srcReg2;
219 if (single) {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800220 rlSrc1 = loadValue(cUnit, rlSrc1, kFPReg);
221 srcReg1 = rlSrc1.lowReg;
jeffhao644d5312012-05-03 19:04:49 -0700222 rlSrc2 = loadValue(cUnit, rlSrc2, kFPReg);
223 srcReg2 = rlSrc2.lowReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800224 } else {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800225 rlSrc1 = loadValueWide(cUnit, rlSrc1, kFPReg);
buzbeef0504cd2012-11-13 16:31:10 -0800226 srcReg1 = s2d(rlSrc1.lowReg, rlSrc1.highReg);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800227 rlSrc2 = loadValueWide(cUnit, rlSrc2, kFPReg);
buzbeef0504cd2012-11-13 16:31:10 -0800228 srcReg2 = s2d(rlSrc2.lowReg, rlSrc2.highReg);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800229 }
jeffhao41005dd2012-05-09 17:58:52 -0700230 oatClobberSReg(cUnit, rlDest.sRegLow);
Ian Rogersc6f3bb82012-03-21 20:40:33 -0700231 RegLocation rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
232 loadConstantNoClobber(cUnit, rlResult.lowReg, unorderedGt ? 1 : 0);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800233 if (single) {
234 newLIR2(cUnit, kX86UcomissRR, srcReg1, srcReg2);
235 } else {
236 newLIR2(cUnit, kX86UcomisdRR, srcReg1, srcReg2);
237 }
238 LIR* branch = NULL;
239 if (unorderedGt) {
Ian Rogersb41b33b2012-03-20 14:22:54 -0700240 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800241 }
jeffhao703f2cd2012-07-13 17:25:52 -0700242 // If the result reg can't be byte accessed, use a jump and move instead of a set.
243 if (rlResult.lowReg >= 4) {
244 LIR* branch2 = NULL;
245 if (unorderedGt) {
246 branch2 = newLIR2(cUnit, kX86Jcc8, 0, kX86CondA);
247 newLIR2(cUnit, kX86Mov32RI, rlResult.lowReg, 0x0);
248 } else {
249 branch2 = newLIR2(cUnit, kX86Jcc8, 0, kX86CondBe);
250 newLIR2(cUnit, kX86Mov32RI, rlResult.lowReg, 0x1);
251 }
252 branch2->target = newLIR0(cUnit, kPseudoTargetLabel);
253 } else {
254 newLIR2(cUnit, kX86Set8R, rlResult.lowReg, kX86CondA /* above - unsigned > */);
255 }
Ian Rogersb5d09b22012-03-06 22:14:17 -0800256 newLIR2(cUnit, kX86Sbb32RI, rlResult.lowReg, 0);
257 if (unorderedGt) {
258 branch->target = newLIR0(cUnit, kPseudoTargetLabel);
259 }
jeffhao644d5312012-05-03 19:04:49 -0700260 storeValue(cUnit, rlDest, rlResult);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800261 return false;
buzbeee88dfbf2012-03-05 11:19:57 -0800262}
263
jeffhao4b771a02012-07-25 15:07:21 -0700264void genFusedFPCmpBranch(CompilationUnit* cUnit, BasicBlock* bb, MIR* mir,
265 bool gtBias, bool isDouble) {
266 LIR* labelList = cUnit->blockLabelList;
267 LIR* taken = &labelList[bb->taken->id];
268 LIR* notTaken = &labelList[bb->fallThrough->id];
269 LIR* branch = NULL;
270 RegLocation rlSrc1;
271 RegLocation rlSrc2;
272 if (isDouble) {
273 rlSrc1 = oatGetSrcWide(cUnit, mir, 0);
274 rlSrc2 = oatGetSrcWide(cUnit, mir, 2);
275 rlSrc1 = loadValueWide(cUnit, rlSrc1, kFPReg);
276 rlSrc2 = loadValueWide(cUnit, rlSrc2, kFPReg);
buzbeef0504cd2012-11-13 16:31:10 -0800277 newLIR2(cUnit, kX86UcomisdRR, s2d(rlSrc1.lowReg, rlSrc1.highReg),
278 s2d(rlSrc2.lowReg, rlSrc2.highReg));
jeffhao4b771a02012-07-25 15:07:21 -0700279 } else {
280 rlSrc1 = oatGetSrc(cUnit, mir, 0);
281 rlSrc2 = oatGetSrc(cUnit, mir, 1);
282 rlSrc1 = loadValue(cUnit, rlSrc1, kFPReg);
283 rlSrc2 = loadValue(cUnit, rlSrc2, kFPReg);
284 newLIR2(cUnit, kX86UcomissRR, rlSrc1.lowReg, rlSrc2.lowReg);
285 }
286 ConditionCode ccode = static_cast<ConditionCode>(mir->dalvikInsn.arg[0]);
287 switch (ccode) {
288 case kCondEq:
jeffhao0e3ac142012-08-03 18:24:38 -0700289 if (!gtBias) {
jeffhao4b771a02012-07-25 15:07:21 -0700290 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
291 branch->target = notTaken;
292 }
293 break;
294 case kCondNe:
295 if (!gtBias) {
296 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
297 branch->target = taken;
298 }
299 break;
300 case kCondLt:
301 if (gtBias) {
302 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
303 branch->target = notTaken;
304 }
305 ccode = kCondCs;
306 break;
307 case kCondLe:
308 if (gtBias) {
309 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
310 branch->target = notTaken;
311 }
312 ccode = kCondLs;
313 break;
314 case kCondGt:
315 if (gtBias) {
316 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
317 branch->target = taken;
318 }
319 ccode = kCondHi;
320 break;
321 case kCondGe:
322 if (gtBias) {
323 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
324 branch->target = taken;
325 }
326 ccode = kCondCc;
327 break;
328 default:
329 LOG(FATAL) << "Unexpected ccode: " << (int)ccode;
330 }
331 opCondBranch(cUnit, ccode, taken);
332}
333
buzbeee88dfbf2012-03-05 11:19:57 -0800334} // namespace art