blob: 92190cc93db2bb23f679c5bcb28ab3c1e48700f0 [file] [log] [blame]
/*
 * Copyright (C) 2012 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16
buzbee1bc37c62012-11-20 13:35:41 -080017#include "x86_lir.h"
18#include "../codegen_util.h"
19#include "../ralloc_util.h"
20
buzbeee88dfbf2012-03-05 11:19:57 -080021namespace art {
22
buzbeeeaf09bc2012-11-15 14:51:41 -080023bool genArithOpFloat(CompilationUnit *cUnit, Instruction::Code opcode,
24 RegLocation rlDest, RegLocation rlSrc1, RegLocation rlSrc2) {
Ian Rogersb5d09b22012-03-06 22:14:17 -080025 X86OpCode op = kX86Nop;
26 RegLocation rlResult;
buzbeee88dfbf2012-03-05 11:19:57 -080027
Ian Rogersb5d09b22012-03-06 22:14:17 -080028 /*
29 * Don't attempt to optimize register usage since these opcodes call out to
30 * the handlers.
31 */
buzbee408ad162012-06-06 16:45:18 -070032 switch (opcode) {
Ian Rogersb5d09b22012-03-06 22:14:17 -080033 case Instruction::ADD_FLOAT_2ADDR:
34 case Instruction::ADD_FLOAT:
35 op = kX86AddssRR;
36 break;
37 case Instruction::SUB_FLOAT_2ADDR:
38 case Instruction::SUB_FLOAT:
39 op = kX86SubssRR;
40 break;
41 case Instruction::DIV_FLOAT_2ADDR:
42 case Instruction::DIV_FLOAT:
43 op = kX86DivssRR;
44 break;
45 case Instruction::MUL_FLOAT_2ADDR:
46 case Instruction::MUL_FLOAT:
47 op = kX86MulssRR;
48 break;
jeffhaobabda952012-08-02 15:55:30 -070049 case Instruction::NEG_FLOAT:
Ian Rogersb5d09b22012-03-06 22:14:17 -080050 case Instruction::REM_FLOAT_2ADDR:
jeffhaobabda952012-08-02 15:55:30 -070051 case Instruction::REM_FLOAT:
buzbee408ad162012-06-06 16:45:18 -070052 return genArithOpFloatPortable(cUnit, opcode, rlDest, rlSrc1, rlSrc2);
Ian Rogersb5d09b22012-03-06 22:14:17 -080053 default:
54 return true;
55 }
56 rlSrc1 = loadValue(cUnit, rlSrc1, kFPReg);
57 rlSrc2 = loadValue(cUnit, rlSrc2, kFPReg);
58 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
59 int rDest = rlResult.lowReg;
60 int rSrc1 = rlSrc1.lowReg;
61 int rSrc2 = rlSrc2.lowReg;
jeffhao573b4292012-07-30 16:37:41 -070062 if (rDest == rSrc2) {
jeffhao4abb1a92012-06-08 17:02:08 -070063 rSrc2 = oatAllocTempFloat(cUnit);
64 opRegCopy(cUnit, rSrc2, rDest);
65 }
Ian Rogersb5d09b22012-03-06 22:14:17 -080066 opRegCopy(cUnit, rDest, rSrc1);
67 newLIR2(cUnit, op, rDest, rSrc2);
68 storeValue(cUnit, rlDest, rlResult);
buzbeee88dfbf2012-03-05 11:19:57 -080069
Ian Rogersb5d09b22012-03-06 22:14:17 -080070 return false;
buzbeee88dfbf2012-03-05 11:19:57 -080071}
72
buzbeeeaf09bc2012-11-15 14:51:41 -080073bool genArithOpDouble(CompilationUnit *cUnit, Instruction::Code opcode,
74 RegLocation rlDest, RegLocation rlSrc1, RegLocation rlSrc2) {
Ian Rogersb5d09b22012-03-06 22:14:17 -080075 X86OpCode op = kX86Nop;
76 RegLocation rlResult;
buzbeee88dfbf2012-03-05 11:19:57 -080077
buzbee408ad162012-06-06 16:45:18 -070078 switch (opcode) {
Ian Rogersb5d09b22012-03-06 22:14:17 -080079 case Instruction::ADD_DOUBLE_2ADDR:
80 case Instruction::ADD_DOUBLE:
81 op = kX86AddsdRR;
82 break;
83 case Instruction::SUB_DOUBLE_2ADDR:
84 case Instruction::SUB_DOUBLE:
85 op = kX86SubsdRR;
86 break;
87 case Instruction::DIV_DOUBLE_2ADDR:
88 case Instruction::DIV_DOUBLE:
89 op = kX86DivsdRR;
90 break;
91 case Instruction::MUL_DOUBLE_2ADDR:
92 case Instruction::MUL_DOUBLE:
93 op = kX86MulsdRR;
94 break;
jeffhaobabda952012-08-02 15:55:30 -070095 case Instruction::NEG_DOUBLE:
Ian Rogersb5d09b22012-03-06 22:14:17 -080096 case Instruction::REM_DOUBLE_2ADDR:
jeffhaobabda952012-08-02 15:55:30 -070097 case Instruction::REM_DOUBLE:
buzbee408ad162012-06-06 16:45:18 -070098 return genArithOpDoublePortable(cUnit, opcode, rlDest, rlSrc1, rlSrc2);
Ian Rogersb5d09b22012-03-06 22:14:17 -080099 default:
100 return true;
101 }
102 rlSrc1 = loadValueWide(cUnit, rlSrc1, kFPReg);
103 DCHECK(rlSrc1.wide);
104 rlSrc2 = loadValueWide(cUnit, rlSrc2, kFPReg);
105 DCHECK(rlSrc2.wide);
106 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
107 DCHECK(rlDest.wide);
108 DCHECK(rlResult.wide);
buzbeef0504cd2012-11-13 16:31:10 -0800109 int rDest = s2d(rlResult.lowReg, rlResult.highReg);
110 int rSrc1 = s2d(rlSrc1.lowReg, rlSrc1.highReg);
111 int rSrc2 = s2d(rlSrc2.lowReg, rlSrc2.highReg);
jeffhao4abb1a92012-06-08 17:02:08 -0700112 if (rDest == rSrc2) {
buzbeef0504cd2012-11-13 16:31:10 -0800113 rSrc2 = oatAllocTempDouble(cUnit) | X86_FP_DOUBLE;
jeffhao4abb1a92012-06-08 17:02:08 -0700114 opRegCopy(cUnit, rSrc2, rDest);
115 }
Ian Rogersb5d09b22012-03-06 22:14:17 -0800116 opRegCopy(cUnit, rDest, rSrc1);
117 newLIR2(cUnit, op, rDest, rSrc2);
118 storeValueWide(cUnit, rlDest, rlResult);
119 return false;
buzbeee88dfbf2012-03-05 11:19:57 -0800120}
121
buzbeeeaf09bc2012-11-15 14:51:41 -0800122bool genConversion(CompilationUnit *cUnit, Instruction::Code opcode,
123 RegLocation rlDest, RegLocation rlSrc) {
jeffhao5121e0b2012-05-08 18:23:38 -0700124 RegisterClass rcSrc = kFPReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800125 X86OpCode op = kX86Nop;
126 int srcReg;
127 RegLocation rlResult;
128 switch (opcode) {
129 case Instruction::INT_TO_FLOAT:
jeffhao5121e0b2012-05-08 18:23:38 -0700130 rcSrc = kCoreReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800131 op = kX86Cvtsi2ssRR;
132 break;
133 case Instruction::DOUBLE_TO_FLOAT:
jeffhao5121e0b2012-05-08 18:23:38 -0700134 rcSrc = kFPReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800135 op = kX86Cvtsd2ssRR;
136 break;
137 case Instruction::FLOAT_TO_DOUBLE:
jeffhao5121e0b2012-05-08 18:23:38 -0700138 rcSrc = kFPReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800139 op = kX86Cvtss2sdRR;
140 break;
141 case Instruction::INT_TO_DOUBLE:
jeffhao5121e0b2012-05-08 18:23:38 -0700142 rcSrc = kCoreReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800143 op = kX86Cvtsi2sdRR;
144 break;
jeffhao292188d2012-05-17 15:45:04 -0700145 case Instruction::FLOAT_TO_INT: {
jeffhao41005dd2012-05-09 17:58:52 -0700146 rlSrc = loadValue(cUnit, rlSrc, kFPReg);
147 srcReg = rlSrc.lowReg;
jeffhao41005dd2012-05-09 17:58:52 -0700148 oatClobberSReg(cUnit, rlDest.sRegLow);
149 rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
jeffhao292188d2012-05-17 15:45:04 -0700150 int tempReg = oatAllocTempFloat(cUnit);
jeffhao41005dd2012-05-09 17:58:52 -0700151
152 loadConstant(cUnit, rlResult.lowReg, 0x7fffffff);
153 newLIR2(cUnit, kX86Cvtsi2ssRR, tempReg, rlResult.lowReg);
154 newLIR2(cUnit, kX86ComissRR, srcReg, tempReg);
jeffhao292188d2012-05-17 15:45:04 -0700155 LIR* branchPosOverflow = newLIR2(cUnit, kX86Jcc8, 0, kX86CondA);
156 LIR* branchNaN = newLIR2(cUnit, kX86Jcc8, 0, kX86CondP);
157 newLIR2(cUnit, kX86Cvttss2siRR, rlResult.lowReg, srcReg);
158 LIR* branchNormal = newLIR1(cUnit, kX86Jmp8, 0);
159 branchNaN->target = newLIR0(cUnit, kPseudoTargetLabel);
160 newLIR2(cUnit, kX86Xor32RR, rlResult.lowReg, rlResult.lowReg);
161 branchPosOverflow->target = newLIR0(cUnit, kPseudoTargetLabel);
162 branchNormal->target = newLIR0(cUnit, kPseudoTargetLabel);
jeffhao41005dd2012-05-09 17:58:52 -0700163 storeValue(cUnit, rlDest, rlResult);
164 return false;
jeffhao292188d2012-05-17 15:45:04 -0700165 }
166 case Instruction::DOUBLE_TO_INT: {
jeffhao41005dd2012-05-09 17:58:52 -0700167 rlSrc = loadValueWide(cUnit, rlSrc, kFPReg);
168 srcReg = rlSrc.lowReg;
jeffhao41005dd2012-05-09 17:58:52 -0700169 oatClobberSReg(cUnit, rlDest.sRegLow);
170 rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
buzbeef0504cd2012-11-13 16:31:10 -0800171 int tempReg = oatAllocTempDouble(cUnit) | X86_FP_DOUBLE;
jeffhao41005dd2012-05-09 17:58:52 -0700172
173 loadConstant(cUnit, rlResult.lowReg, 0x7fffffff);
174 newLIR2(cUnit, kX86Cvtsi2sdRR, tempReg, rlResult.lowReg);
175 newLIR2(cUnit, kX86ComisdRR, srcReg, tempReg);
jeffhao292188d2012-05-17 15:45:04 -0700176 LIR* branchPosOverflow = newLIR2(cUnit, kX86Jcc8, 0, kX86CondA);
177 LIR* branchNaN = newLIR2(cUnit, kX86Jcc8, 0, kX86CondP);
178 newLIR2(cUnit, kX86Cvttsd2siRR, rlResult.lowReg, srcReg);
179 LIR* branchNormal = newLIR1(cUnit, kX86Jmp8, 0);
180 branchNaN->target = newLIR0(cUnit, kPseudoTargetLabel);
181 newLIR2(cUnit, kX86Xor32RR, rlResult.lowReg, rlResult.lowReg);
182 branchPosOverflow->target = newLIR0(cUnit, kPseudoTargetLabel);
183 branchNormal->target = newLIR0(cUnit, kPseudoTargetLabel);
jeffhao41005dd2012-05-09 17:58:52 -0700184 storeValue(cUnit, rlDest, rlResult);
185 return false;
jeffhao292188d2012-05-17 15:45:04 -0700186 }
Ian Rogersb5d09b22012-03-06 22:14:17 -0800187 case Instruction::LONG_TO_DOUBLE:
Ian Rogersb5d09b22012-03-06 22:14:17 -0800188 case Instruction::LONG_TO_FLOAT:
jeffhaobabda952012-08-02 15:55:30 -0700189 // TODO: inline by using memory as a 64-bit source. Be careful about promoted registers.
jeffhao41005dd2012-05-09 17:58:52 -0700190 case Instruction::FLOAT_TO_LONG:
Ian Rogersb5d09b22012-03-06 22:14:17 -0800191 case Instruction::DOUBLE_TO_LONG:
buzbee408ad162012-06-06 16:45:18 -0700192 return genConversionPortable(cUnit, opcode, rlDest, rlSrc);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800193 default:
194 return true;
195 }
buzbee408ad162012-06-06 16:45:18 -0700196 if (rlSrc.wide) {
jeffhao5121e0b2012-05-08 18:23:38 -0700197 rlSrc = loadValueWide(cUnit, rlSrc, rcSrc);
buzbeef0504cd2012-11-13 16:31:10 -0800198 srcReg = s2d(rlSrc.lowReg, rlSrc.highReg);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800199 } else {
jeffhao5121e0b2012-05-08 18:23:38 -0700200 rlSrc = loadValue(cUnit, rlSrc, rcSrc);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800201 srcReg = rlSrc.lowReg;
202 }
buzbee408ad162012-06-06 16:45:18 -0700203 if (rlDest.wide) {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800204 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
buzbeef0504cd2012-11-13 16:31:10 -0800205 newLIR2(cUnit, op, s2d(rlResult.lowReg, rlResult.highReg), srcReg);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800206 storeValueWide(cUnit, rlDest, rlResult);
207 } else {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800208 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
209 newLIR2(cUnit, op, rlResult.lowReg, srcReg);
210 storeValue(cUnit, rlDest, rlResult);
211 }
212 return false;
buzbeee88dfbf2012-03-05 11:19:57 -0800213}
214
buzbeeeaf09bc2012-11-15 14:51:41 -0800215bool genCmpFP(CompilationUnit *cUnit, Instruction::Code code, RegLocation rlDest,
216 RegLocation rlSrc1, RegLocation rlSrc2) {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800217 bool single = (code == Instruction::CMPL_FLOAT) || (code == Instruction::CMPG_FLOAT);
218 bool unorderedGt = (code == Instruction::CMPG_DOUBLE) || (code == Instruction::CMPG_FLOAT);
219 int srcReg1;
220 int srcReg2;
221 if (single) {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800222 rlSrc1 = loadValue(cUnit, rlSrc1, kFPReg);
223 srcReg1 = rlSrc1.lowReg;
jeffhao644d5312012-05-03 19:04:49 -0700224 rlSrc2 = loadValue(cUnit, rlSrc2, kFPReg);
225 srcReg2 = rlSrc2.lowReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800226 } else {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800227 rlSrc1 = loadValueWide(cUnit, rlSrc1, kFPReg);
buzbeef0504cd2012-11-13 16:31:10 -0800228 srcReg1 = s2d(rlSrc1.lowReg, rlSrc1.highReg);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800229 rlSrc2 = loadValueWide(cUnit, rlSrc2, kFPReg);
buzbeef0504cd2012-11-13 16:31:10 -0800230 srcReg2 = s2d(rlSrc2.lowReg, rlSrc2.highReg);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800231 }
jeffhao41005dd2012-05-09 17:58:52 -0700232 oatClobberSReg(cUnit, rlDest.sRegLow);
Ian Rogersc6f3bb82012-03-21 20:40:33 -0700233 RegLocation rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
234 loadConstantNoClobber(cUnit, rlResult.lowReg, unorderedGt ? 1 : 0);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800235 if (single) {
236 newLIR2(cUnit, kX86UcomissRR, srcReg1, srcReg2);
237 } else {
238 newLIR2(cUnit, kX86UcomisdRR, srcReg1, srcReg2);
239 }
240 LIR* branch = NULL;
241 if (unorderedGt) {
Ian Rogersb41b33b2012-03-20 14:22:54 -0700242 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800243 }
jeffhao703f2cd2012-07-13 17:25:52 -0700244 // If the result reg can't be byte accessed, use a jump and move instead of a set.
245 if (rlResult.lowReg >= 4) {
246 LIR* branch2 = NULL;
247 if (unorderedGt) {
248 branch2 = newLIR2(cUnit, kX86Jcc8, 0, kX86CondA);
249 newLIR2(cUnit, kX86Mov32RI, rlResult.lowReg, 0x0);
250 } else {
251 branch2 = newLIR2(cUnit, kX86Jcc8, 0, kX86CondBe);
252 newLIR2(cUnit, kX86Mov32RI, rlResult.lowReg, 0x1);
253 }
254 branch2->target = newLIR0(cUnit, kPseudoTargetLabel);
255 } else {
256 newLIR2(cUnit, kX86Set8R, rlResult.lowReg, kX86CondA /* above - unsigned > */);
257 }
Ian Rogersb5d09b22012-03-06 22:14:17 -0800258 newLIR2(cUnit, kX86Sbb32RI, rlResult.lowReg, 0);
259 if (unorderedGt) {
260 branch->target = newLIR0(cUnit, kPseudoTargetLabel);
261 }
jeffhao644d5312012-05-03 19:04:49 -0700262 storeValue(cUnit, rlDest, rlResult);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800263 return false;
buzbeee88dfbf2012-03-05 11:19:57 -0800264}
265
jeffhao4b771a02012-07-25 15:07:21 -0700266void genFusedFPCmpBranch(CompilationUnit* cUnit, BasicBlock* bb, MIR* mir,
267 bool gtBias, bool isDouble) {
268 LIR* labelList = cUnit->blockLabelList;
269 LIR* taken = &labelList[bb->taken->id];
270 LIR* notTaken = &labelList[bb->fallThrough->id];
271 LIR* branch = NULL;
272 RegLocation rlSrc1;
273 RegLocation rlSrc2;
274 if (isDouble) {
275 rlSrc1 = oatGetSrcWide(cUnit, mir, 0);
276 rlSrc2 = oatGetSrcWide(cUnit, mir, 2);
277 rlSrc1 = loadValueWide(cUnit, rlSrc1, kFPReg);
278 rlSrc2 = loadValueWide(cUnit, rlSrc2, kFPReg);
buzbeef0504cd2012-11-13 16:31:10 -0800279 newLIR2(cUnit, kX86UcomisdRR, s2d(rlSrc1.lowReg, rlSrc1.highReg),
280 s2d(rlSrc2.lowReg, rlSrc2.highReg));
jeffhao4b771a02012-07-25 15:07:21 -0700281 } else {
282 rlSrc1 = oatGetSrc(cUnit, mir, 0);
283 rlSrc2 = oatGetSrc(cUnit, mir, 1);
284 rlSrc1 = loadValue(cUnit, rlSrc1, kFPReg);
285 rlSrc2 = loadValue(cUnit, rlSrc2, kFPReg);
286 newLIR2(cUnit, kX86UcomissRR, rlSrc1.lowReg, rlSrc2.lowReg);
287 }
288 ConditionCode ccode = static_cast<ConditionCode>(mir->dalvikInsn.arg[0]);
289 switch (ccode) {
290 case kCondEq:
jeffhao0e3ac142012-08-03 18:24:38 -0700291 if (!gtBias) {
jeffhao4b771a02012-07-25 15:07:21 -0700292 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
293 branch->target = notTaken;
294 }
295 break;
296 case kCondNe:
297 if (!gtBias) {
298 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
299 branch->target = taken;
300 }
301 break;
302 case kCondLt:
303 if (gtBias) {
304 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
305 branch->target = notTaken;
306 }
307 ccode = kCondCs;
308 break;
309 case kCondLe:
310 if (gtBias) {
311 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
312 branch->target = notTaken;
313 }
314 ccode = kCondLs;
315 break;
316 case kCondGt:
317 if (gtBias) {
318 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
319 branch->target = taken;
320 }
321 ccode = kCondHi;
322 break;
323 case kCondGe:
324 if (gtBias) {
325 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
326 branch->target = taken;
327 }
328 ccode = kCondCc;
329 break;
330 default:
buzbeecbd6d442012-11-17 14:11:25 -0800331 LOG(FATAL) << "Unexpected ccode: " << ccode;
jeffhao4b771a02012-07-25 15:07:21 -0700332 }
333 opCondBranch(cUnit, ccode, taken);
334}
335
buzbeeefc63692012-11-14 16:31:52 -0800336void genNegFloat(CompilationUnit *cUnit, RegLocation rlDest, RegLocation rlSrc)
337{
338 RegLocation rlResult;
339 rlSrc = loadValue(cUnit, rlSrc, kCoreReg);
340 rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
341 opRegRegImm(cUnit, kOpAdd, rlResult.lowReg, rlSrc.lowReg, 0x80000000);
342 storeValue(cUnit, rlDest, rlResult);
343}
344
345void genNegDouble(CompilationUnit *cUnit, RegLocation rlDest, RegLocation rlSrc)
346{
347 RegLocation rlResult;
348 rlSrc = loadValueWide(cUnit, rlSrc, kCoreReg);
349 rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
350 opRegRegImm(cUnit, kOpAdd, rlResult.highReg, rlSrc.highReg, 0x80000000);
351 opRegCopy(cUnit, rlResult.lowReg, rlSrc.lowReg);
352 storeValueWide(cUnit, rlDest, rlResult);
353}
354
355bool genInlinedSqrt(CompilationUnit* cUnit, CallInfo* info) {
356 DCHECK_NE(cUnit->instructionSet, kThumb2);
357 return false;
358}
359
360
361
buzbeee88dfbf2012-03-05 11:19:57 -0800362} // namespace art