blob: 411bd1e381c5b5ffd38496afb8948a012f0333ba [file] [log] [blame]
buzbeee88dfbf2012-03-05 11:19:57 -08001/*
2 * Copyright (C) 2012 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17namespace art {
18
buzbeeeaf09bc2012-11-15 14:51:41 -080019bool genArithOpFloat(CompilationUnit *cUnit, Instruction::Code opcode,
20 RegLocation rlDest, RegLocation rlSrc1, RegLocation rlSrc2) {
Ian Rogersb5d09b22012-03-06 22:14:17 -080021 X86OpCode op = kX86Nop;
22 RegLocation rlResult;
buzbeee88dfbf2012-03-05 11:19:57 -080023
Ian Rogersb5d09b22012-03-06 22:14:17 -080024 /*
25 * Don't attempt to optimize register usage since these opcodes call out to
26 * the handlers.
27 */
buzbee408ad162012-06-06 16:45:18 -070028 switch (opcode) {
Ian Rogersb5d09b22012-03-06 22:14:17 -080029 case Instruction::ADD_FLOAT_2ADDR:
30 case Instruction::ADD_FLOAT:
31 op = kX86AddssRR;
32 break;
33 case Instruction::SUB_FLOAT_2ADDR:
34 case Instruction::SUB_FLOAT:
35 op = kX86SubssRR;
36 break;
37 case Instruction::DIV_FLOAT_2ADDR:
38 case Instruction::DIV_FLOAT:
39 op = kX86DivssRR;
40 break;
41 case Instruction::MUL_FLOAT_2ADDR:
42 case Instruction::MUL_FLOAT:
43 op = kX86MulssRR;
44 break;
jeffhaobabda952012-08-02 15:55:30 -070045 case Instruction::NEG_FLOAT:
Ian Rogersb5d09b22012-03-06 22:14:17 -080046 case Instruction::REM_FLOAT_2ADDR:
jeffhaobabda952012-08-02 15:55:30 -070047 case Instruction::REM_FLOAT:
buzbee408ad162012-06-06 16:45:18 -070048 return genArithOpFloatPortable(cUnit, opcode, rlDest, rlSrc1, rlSrc2);
Ian Rogersb5d09b22012-03-06 22:14:17 -080049 default:
50 return true;
51 }
52 rlSrc1 = loadValue(cUnit, rlSrc1, kFPReg);
53 rlSrc2 = loadValue(cUnit, rlSrc2, kFPReg);
54 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
55 int rDest = rlResult.lowReg;
56 int rSrc1 = rlSrc1.lowReg;
57 int rSrc2 = rlSrc2.lowReg;
jeffhao573b4292012-07-30 16:37:41 -070058 if (rDest == rSrc2) {
jeffhao4abb1a92012-06-08 17:02:08 -070059 rSrc2 = oatAllocTempFloat(cUnit);
60 opRegCopy(cUnit, rSrc2, rDest);
61 }
Ian Rogersb5d09b22012-03-06 22:14:17 -080062 opRegCopy(cUnit, rDest, rSrc1);
63 newLIR2(cUnit, op, rDest, rSrc2);
64 storeValue(cUnit, rlDest, rlResult);
buzbeee88dfbf2012-03-05 11:19:57 -080065
Ian Rogersb5d09b22012-03-06 22:14:17 -080066 return false;
buzbeee88dfbf2012-03-05 11:19:57 -080067}
68
buzbeeeaf09bc2012-11-15 14:51:41 -080069bool genArithOpDouble(CompilationUnit *cUnit, Instruction::Code opcode,
70 RegLocation rlDest, RegLocation rlSrc1, RegLocation rlSrc2) {
Ian Rogersb5d09b22012-03-06 22:14:17 -080071 X86OpCode op = kX86Nop;
72 RegLocation rlResult;
buzbeee88dfbf2012-03-05 11:19:57 -080073
buzbee408ad162012-06-06 16:45:18 -070074 switch (opcode) {
Ian Rogersb5d09b22012-03-06 22:14:17 -080075 case Instruction::ADD_DOUBLE_2ADDR:
76 case Instruction::ADD_DOUBLE:
77 op = kX86AddsdRR;
78 break;
79 case Instruction::SUB_DOUBLE_2ADDR:
80 case Instruction::SUB_DOUBLE:
81 op = kX86SubsdRR;
82 break;
83 case Instruction::DIV_DOUBLE_2ADDR:
84 case Instruction::DIV_DOUBLE:
85 op = kX86DivsdRR;
86 break;
87 case Instruction::MUL_DOUBLE_2ADDR:
88 case Instruction::MUL_DOUBLE:
89 op = kX86MulsdRR;
90 break;
jeffhaobabda952012-08-02 15:55:30 -070091 case Instruction::NEG_DOUBLE:
Ian Rogersb5d09b22012-03-06 22:14:17 -080092 case Instruction::REM_DOUBLE_2ADDR:
jeffhaobabda952012-08-02 15:55:30 -070093 case Instruction::REM_DOUBLE:
buzbee408ad162012-06-06 16:45:18 -070094 return genArithOpDoublePortable(cUnit, opcode, rlDest, rlSrc1, rlSrc2);
Ian Rogersb5d09b22012-03-06 22:14:17 -080095 default:
96 return true;
97 }
98 rlSrc1 = loadValueWide(cUnit, rlSrc1, kFPReg);
99 DCHECK(rlSrc1.wide);
100 rlSrc2 = loadValueWide(cUnit, rlSrc2, kFPReg);
101 DCHECK(rlSrc2.wide);
102 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
103 DCHECK(rlDest.wide);
104 DCHECK(rlResult.wide);
buzbeef0504cd2012-11-13 16:31:10 -0800105 int rDest = s2d(rlResult.lowReg, rlResult.highReg);
106 int rSrc1 = s2d(rlSrc1.lowReg, rlSrc1.highReg);
107 int rSrc2 = s2d(rlSrc2.lowReg, rlSrc2.highReg);
jeffhao4abb1a92012-06-08 17:02:08 -0700108 if (rDest == rSrc2) {
buzbeef0504cd2012-11-13 16:31:10 -0800109 rSrc2 = oatAllocTempDouble(cUnit) | X86_FP_DOUBLE;
jeffhao4abb1a92012-06-08 17:02:08 -0700110 opRegCopy(cUnit, rSrc2, rDest);
111 }
Ian Rogersb5d09b22012-03-06 22:14:17 -0800112 opRegCopy(cUnit, rDest, rSrc1);
113 newLIR2(cUnit, op, rDest, rSrc2);
114 storeValueWide(cUnit, rlDest, rlResult);
115 return false;
buzbeee88dfbf2012-03-05 11:19:57 -0800116}
117
buzbeeeaf09bc2012-11-15 14:51:41 -0800118bool genConversion(CompilationUnit *cUnit, Instruction::Code opcode,
119 RegLocation rlDest, RegLocation rlSrc) {
jeffhao5121e0b2012-05-08 18:23:38 -0700120 RegisterClass rcSrc = kFPReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800121 X86OpCode op = kX86Nop;
122 int srcReg;
123 RegLocation rlResult;
124 switch (opcode) {
125 case Instruction::INT_TO_FLOAT:
jeffhao5121e0b2012-05-08 18:23:38 -0700126 rcSrc = kCoreReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800127 op = kX86Cvtsi2ssRR;
128 break;
129 case Instruction::DOUBLE_TO_FLOAT:
jeffhao5121e0b2012-05-08 18:23:38 -0700130 rcSrc = kFPReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800131 op = kX86Cvtsd2ssRR;
132 break;
133 case Instruction::FLOAT_TO_DOUBLE:
jeffhao5121e0b2012-05-08 18:23:38 -0700134 rcSrc = kFPReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800135 op = kX86Cvtss2sdRR;
136 break;
137 case Instruction::INT_TO_DOUBLE:
jeffhao5121e0b2012-05-08 18:23:38 -0700138 rcSrc = kCoreReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800139 op = kX86Cvtsi2sdRR;
140 break;
jeffhao292188d2012-05-17 15:45:04 -0700141 case Instruction::FLOAT_TO_INT: {
jeffhao41005dd2012-05-09 17:58:52 -0700142 rlSrc = loadValue(cUnit, rlSrc, kFPReg);
143 srcReg = rlSrc.lowReg;
jeffhao41005dd2012-05-09 17:58:52 -0700144 oatClobberSReg(cUnit, rlDest.sRegLow);
145 rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
jeffhao292188d2012-05-17 15:45:04 -0700146 int tempReg = oatAllocTempFloat(cUnit);
jeffhao41005dd2012-05-09 17:58:52 -0700147
148 loadConstant(cUnit, rlResult.lowReg, 0x7fffffff);
149 newLIR2(cUnit, kX86Cvtsi2ssRR, tempReg, rlResult.lowReg);
150 newLIR2(cUnit, kX86ComissRR, srcReg, tempReg);
jeffhao292188d2012-05-17 15:45:04 -0700151 LIR* branchPosOverflow = newLIR2(cUnit, kX86Jcc8, 0, kX86CondA);
152 LIR* branchNaN = newLIR2(cUnit, kX86Jcc8, 0, kX86CondP);
153 newLIR2(cUnit, kX86Cvttss2siRR, rlResult.lowReg, srcReg);
154 LIR* branchNormal = newLIR1(cUnit, kX86Jmp8, 0);
155 branchNaN->target = newLIR0(cUnit, kPseudoTargetLabel);
156 newLIR2(cUnit, kX86Xor32RR, rlResult.lowReg, rlResult.lowReg);
157 branchPosOverflow->target = newLIR0(cUnit, kPseudoTargetLabel);
158 branchNormal->target = newLIR0(cUnit, kPseudoTargetLabel);
jeffhao41005dd2012-05-09 17:58:52 -0700159 storeValue(cUnit, rlDest, rlResult);
160 return false;
jeffhao292188d2012-05-17 15:45:04 -0700161 }
162 case Instruction::DOUBLE_TO_INT: {
jeffhao41005dd2012-05-09 17:58:52 -0700163 rlSrc = loadValueWide(cUnit, rlSrc, kFPReg);
164 srcReg = rlSrc.lowReg;
jeffhao41005dd2012-05-09 17:58:52 -0700165 oatClobberSReg(cUnit, rlDest.sRegLow);
166 rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
buzbeef0504cd2012-11-13 16:31:10 -0800167 int tempReg = oatAllocTempDouble(cUnit) | X86_FP_DOUBLE;
jeffhao41005dd2012-05-09 17:58:52 -0700168
169 loadConstant(cUnit, rlResult.lowReg, 0x7fffffff);
170 newLIR2(cUnit, kX86Cvtsi2sdRR, tempReg, rlResult.lowReg);
171 newLIR2(cUnit, kX86ComisdRR, srcReg, tempReg);
jeffhao292188d2012-05-17 15:45:04 -0700172 LIR* branchPosOverflow = newLIR2(cUnit, kX86Jcc8, 0, kX86CondA);
173 LIR* branchNaN = newLIR2(cUnit, kX86Jcc8, 0, kX86CondP);
174 newLIR2(cUnit, kX86Cvttsd2siRR, rlResult.lowReg, srcReg);
175 LIR* branchNormal = newLIR1(cUnit, kX86Jmp8, 0);
176 branchNaN->target = newLIR0(cUnit, kPseudoTargetLabel);
177 newLIR2(cUnit, kX86Xor32RR, rlResult.lowReg, rlResult.lowReg);
178 branchPosOverflow->target = newLIR0(cUnit, kPseudoTargetLabel);
179 branchNormal->target = newLIR0(cUnit, kPseudoTargetLabel);
jeffhao41005dd2012-05-09 17:58:52 -0700180 storeValue(cUnit, rlDest, rlResult);
181 return false;
jeffhao292188d2012-05-17 15:45:04 -0700182 }
Ian Rogersb5d09b22012-03-06 22:14:17 -0800183 case Instruction::LONG_TO_DOUBLE:
Ian Rogersb5d09b22012-03-06 22:14:17 -0800184 case Instruction::LONG_TO_FLOAT:
jeffhaobabda952012-08-02 15:55:30 -0700185 // TODO: inline by using memory as a 64-bit source. Be careful about promoted registers.
jeffhao41005dd2012-05-09 17:58:52 -0700186 case Instruction::FLOAT_TO_LONG:
Ian Rogersb5d09b22012-03-06 22:14:17 -0800187 case Instruction::DOUBLE_TO_LONG:
buzbee408ad162012-06-06 16:45:18 -0700188 return genConversionPortable(cUnit, opcode, rlDest, rlSrc);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800189 default:
190 return true;
191 }
buzbee408ad162012-06-06 16:45:18 -0700192 if (rlSrc.wide) {
jeffhao5121e0b2012-05-08 18:23:38 -0700193 rlSrc = loadValueWide(cUnit, rlSrc, rcSrc);
buzbeef0504cd2012-11-13 16:31:10 -0800194 srcReg = s2d(rlSrc.lowReg, rlSrc.highReg);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800195 } else {
jeffhao5121e0b2012-05-08 18:23:38 -0700196 rlSrc = loadValue(cUnit, rlSrc, rcSrc);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800197 srcReg = rlSrc.lowReg;
198 }
buzbee408ad162012-06-06 16:45:18 -0700199 if (rlDest.wide) {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800200 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
buzbeef0504cd2012-11-13 16:31:10 -0800201 newLIR2(cUnit, op, s2d(rlResult.lowReg, rlResult.highReg), srcReg);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800202 storeValueWide(cUnit, rlDest, rlResult);
203 } else {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800204 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
205 newLIR2(cUnit, op, rlResult.lowReg, srcReg);
206 storeValue(cUnit, rlDest, rlResult);
207 }
208 return false;
buzbeee88dfbf2012-03-05 11:19:57 -0800209}
210
buzbeeeaf09bc2012-11-15 14:51:41 -0800211bool genCmpFP(CompilationUnit *cUnit, Instruction::Code code, RegLocation rlDest,
212 RegLocation rlSrc1, RegLocation rlSrc2) {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800213 bool single = (code == Instruction::CMPL_FLOAT) || (code == Instruction::CMPG_FLOAT);
214 bool unorderedGt = (code == Instruction::CMPG_DOUBLE) || (code == Instruction::CMPG_FLOAT);
215 int srcReg1;
216 int srcReg2;
217 if (single) {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800218 rlSrc1 = loadValue(cUnit, rlSrc1, kFPReg);
219 srcReg1 = rlSrc1.lowReg;
jeffhao644d5312012-05-03 19:04:49 -0700220 rlSrc2 = loadValue(cUnit, rlSrc2, kFPReg);
221 srcReg2 = rlSrc2.lowReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800222 } else {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800223 rlSrc1 = loadValueWide(cUnit, rlSrc1, kFPReg);
buzbeef0504cd2012-11-13 16:31:10 -0800224 srcReg1 = s2d(rlSrc1.lowReg, rlSrc1.highReg);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800225 rlSrc2 = loadValueWide(cUnit, rlSrc2, kFPReg);
buzbeef0504cd2012-11-13 16:31:10 -0800226 srcReg2 = s2d(rlSrc2.lowReg, rlSrc2.highReg);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800227 }
jeffhao41005dd2012-05-09 17:58:52 -0700228 oatClobberSReg(cUnit, rlDest.sRegLow);
Ian Rogersc6f3bb82012-03-21 20:40:33 -0700229 RegLocation rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
230 loadConstantNoClobber(cUnit, rlResult.lowReg, unorderedGt ? 1 : 0);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800231 if (single) {
232 newLIR2(cUnit, kX86UcomissRR, srcReg1, srcReg2);
233 } else {
234 newLIR2(cUnit, kX86UcomisdRR, srcReg1, srcReg2);
235 }
236 LIR* branch = NULL;
237 if (unorderedGt) {
Ian Rogersb41b33b2012-03-20 14:22:54 -0700238 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800239 }
jeffhao703f2cd2012-07-13 17:25:52 -0700240 // If the result reg can't be byte accessed, use a jump and move instead of a set.
241 if (rlResult.lowReg >= 4) {
242 LIR* branch2 = NULL;
243 if (unorderedGt) {
244 branch2 = newLIR2(cUnit, kX86Jcc8, 0, kX86CondA);
245 newLIR2(cUnit, kX86Mov32RI, rlResult.lowReg, 0x0);
246 } else {
247 branch2 = newLIR2(cUnit, kX86Jcc8, 0, kX86CondBe);
248 newLIR2(cUnit, kX86Mov32RI, rlResult.lowReg, 0x1);
249 }
250 branch2->target = newLIR0(cUnit, kPseudoTargetLabel);
251 } else {
252 newLIR2(cUnit, kX86Set8R, rlResult.lowReg, kX86CondA /* above - unsigned > */);
253 }
Ian Rogersb5d09b22012-03-06 22:14:17 -0800254 newLIR2(cUnit, kX86Sbb32RI, rlResult.lowReg, 0);
255 if (unorderedGt) {
256 branch->target = newLIR0(cUnit, kPseudoTargetLabel);
257 }
jeffhao644d5312012-05-03 19:04:49 -0700258 storeValue(cUnit, rlDest, rlResult);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800259 return false;
buzbeee88dfbf2012-03-05 11:19:57 -0800260}
261
jeffhao4b771a02012-07-25 15:07:21 -0700262void genFusedFPCmpBranch(CompilationUnit* cUnit, BasicBlock* bb, MIR* mir,
263 bool gtBias, bool isDouble) {
264 LIR* labelList = cUnit->blockLabelList;
265 LIR* taken = &labelList[bb->taken->id];
266 LIR* notTaken = &labelList[bb->fallThrough->id];
267 LIR* branch = NULL;
268 RegLocation rlSrc1;
269 RegLocation rlSrc2;
270 if (isDouble) {
271 rlSrc1 = oatGetSrcWide(cUnit, mir, 0);
272 rlSrc2 = oatGetSrcWide(cUnit, mir, 2);
273 rlSrc1 = loadValueWide(cUnit, rlSrc1, kFPReg);
274 rlSrc2 = loadValueWide(cUnit, rlSrc2, kFPReg);
buzbeef0504cd2012-11-13 16:31:10 -0800275 newLIR2(cUnit, kX86UcomisdRR, s2d(rlSrc1.lowReg, rlSrc1.highReg),
276 s2d(rlSrc2.lowReg, rlSrc2.highReg));
jeffhao4b771a02012-07-25 15:07:21 -0700277 } else {
278 rlSrc1 = oatGetSrc(cUnit, mir, 0);
279 rlSrc2 = oatGetSrc(cUnit, mir, 1);
280 rlSrc1 = loadValue(cUnit, rlSrc1, kFPReg);
281 rlSrc2 = loadValue(cUnit, rlSrc2, kFPReg);
282 newLIR2(cUnit, kX86UcomissRR, rlSrc1.lowReg, rlSrc2.lowReg);
283 }
284 ConditionCode ccode = static_cast<ConditionCode>(mir->dalvikInsn.arg[0]);
285 switch (ccode) {
286 case kCondEq:
jeffhao0e3ac142012-08-03 18:24:38 -0700287 if (!gtBias) {
jeffhao4b771a02012-07-25 15:07:21 -0700288 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
289 branch->target = notTaken;
290 }
291 break;
292 case kCondNe:
293 if (!gtBias) {
294 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
295 branch->target = taken;
296 }
297 break;
298 case kCondLt:
299 if (gtBias) {
300 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
301 branch->target = notTaken;
302 }
303 ccode = kCondCs;
304 break;
305 case kCondLe:
306 if (gtBias) {
307 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
308 branch->target = notTaken;
309 }
310 ccode = kCondLs;
311 break;
312 case kCondGt:
313 if (gtBias) {
314 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
315 branch->target = taken;
316 }
317 ccode = kCondHi;
318 break;
319 case kCondGe:
320 if (gtBias) {
321 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
322 branch->target = taken;
323 }
324 ccode = kCondCc;
325 break;
326 default:
327 LOG(FATAL) << "Unexpected ccode: " << (int)ccode;
328 }
329 opCondBranch(cUnit, ccode, taken);
330}
331
buzbeeefc63692012-11-14 16:31:52 -0800332void genNegFloat(CompilationUnit *cUnit, RegLocation rlDest, RegLocation rlSrc)
333{
334 RegLocation rlResult;
335 rlSrc = loadValue(cUnit, rlSrc, kCoreReg);
336 rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
337 opRegRegImm(cUnit, kOpAdd, rlResult.lowReg, rlSrc.lowReg, 0x80000000);
338 storeValue(cUnit, rlDest, rlResult);
339}
340
341void genNegDouble(CompilationUnit *cUnit, RegLocation rlDest, RegLocation rlSrc)
342{
343 RegLocation rlResult;
344 rlSrc = loadValueWide(cUnit, rlSrc, kCoreReg);
345 rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
346 opRegRegImm(cUnit, kOpAdd, rlResult.highReg, rlSrc.highReg, 0x80000000);
347 opRegCopy(cUnit, rlResult.lowReg, rlSrc.lowReg);
348 storeValueWide(cUnit, rlDest, rlResult);
349}
350
351bool genInlinedSqrt(CompilationUnit* cUnit, CallInfo* info) {
352 DCHECK_NE(cUnit->instructionSet, kThumb2);
353 return false;
354}
355
356
357
buzbeee88dfbf2012-03-05 11:19:57 -0800358} // namespace art