blob: 460f56be8b6eef3573a0100cf668169e5a8a707b [file] [log] [blame]
buzbeee88dfbf2012-03-05 11:19:57 -08001/*
2 * Copyright (C) 2012 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17namespace art {
18
buzbee408ad162012-06-06 16:45:18 -070019static bool genArithOpFloat(CompilationUnit *cUnit, Instruction::Code opcode,
Bill Buzbeea114add2012-05-03 15:00:40 -070020 RegLocation rlDest, RegLocation rlSrc1,
21 RegLocation rlSrc2) {
Ian Rogersb5d09b22012-03-06 22:14:17 -080022 X86OpCode op = kX86Nop;
23 RegLocation rlResult;
buzbeee88dfbf2012-03-05 11:19:57 -080024
Ian Rogersb5d09b22012-03-06 22:14:17 -080025 /*
26 * Don't attempt to optimize register usage since these opcodes call out to
27 * the handlers.
28 */
buzbee408ad162012-06-06 16:45:18 -070029 switch (opcode) {
Ian Rogersb5d09b22012-03-06 22:14:17 -080030 case Instruction::ADD_FLOAT_2ADDR:
31 case Instruction::ADD_FLOAT:
32 op = kX86AddssRR;
33 break;
34 case Instruction::SUB_FLOAT_2ADDR:
35 case Instruction::SUB_FLOAT:
36 op = kX86SubssRR;
37 break;
38 case Instruction::DIV_FLOAT_2ADDR:
39 case Instruction::DIV_FLOAT:
40 op = kX86DivssRR;
41 break;
42 case Instruction::MUL_FLOAT_2ADDR:
43 case Instruction::MUL_FLOAT:
44 op = kX86MulssRR;
45 break;
46 case Instruction::NEG_FLOAT:
jeffhao292188d2012-05-17 15:45:04 -070047 rlSrc1 = loadValue(cUnit, rlSrc1, kFPReg);
48 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
49 newLIR2(cUnit, kX86XorpsRR, rlResult.lowReg, rlResult.lowReg);
50 newLIR2(cUnit, kX86SubssRR, rlResult.lowReg, rlSrc1.lowReg);
51 storeValue(cUnit, rlDest, rlResult);
52 return false;
Ian Rogersb5d09b22012-03-06 22:14:17 -080053 case Instruction::REM_FLOAT_2ADDR:
54 case Instruction::REM_FLOAT: {
buzbee408ad162012-06-06 16:45:18 -070055 return genArithOpFloatPortable(cUnit, opcode, rlDest, rlSrc1, rlSrc2);
buzbeee88dfbf2012-03-05 11:19:57 -080056 }
Ian Rogersb5d09b22012-03-06 22:14:17 -080057 default:
58 return true;
59 }
60 rlSrc1 = loadValue(cUnit, rlSrc1, kFPReg);
61 rlSrc2 = loadValue(cUnit, rlSrc2, kFPReg);
62 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
63 int rDest = rlResult.lowReg;
64 int rSrc1 = rlSrc1.lowReg;
65 int rSrc2 = rlSrc2.lowReg;
66 // TODO: at least CHECK_NE(rDest, rSrc2);
67 opRegCopy(cUnit, rDest, rSrc1);
68 newLIR2(cUnit, op, rDest, rSrc2);
69 storeValue(cUnit, rlDest, rlResult);
buzbeee88dfbf2012-03-05 11:19:57 -080070
Ian Rogersb5d09b22012-03-06 22:14:17 -080071 return false;
buzbeee88dfbf2012-03-05 11:19:57 -080072}
73
buzbee408ad162012-06-06 16:45:18 -070074static bool genArithOpDouble(CompilationUnit *cUnit, Instruction::Code opcode,
buzbeee88dfbf2012-03-05 11:19:57 -080075 RegLocation rlDest, RegLocation rlSrc1,
Ian Rogersb5d09b22012-03-06 22:14:17 -080076 RegLocation rlSrc2) {
77 X86OpCode op = kX86Nop;
78 RegLocation rlResult;
buzbeee88dfbf2012-03-05 11:19:57 -080079
buzbee408ad162012-06-06 16:45:18 -070080 switch (opcode) {
Ian Rogersb5d09b22012-03-06 22:14:17 -080081 case Instruction::ADD_DOUBLE_2ADDR:
82 case Instruction::ADD_DOUBLE:
83 op = kX86AddsdRR;
84 break;
85 case Instruction::SUB_DOUBLE_2ADDR:
86 case Instruction::SUB_DOUBLE:
87 op = kX86SubsdRR;
88 break;
89 case Instruction::DIV_DOUBLE_2ADDR:
90 case Instruction::DIV_DOUBLE:
91 op = kX86DivsdRR;
92 break;
93 case Instruction::MUL_DOUBLE_2ADDR:
94 case Instruction::MUL_DOUBLE:
95 op = kX86MulsdRR;
96 break;
97 case Instruction::NEG_DOUBLE:
jeffhao292188d2012-05-17 15:45:04 -070098 rlSrc1 = loadValueWide(cUnit, rlSrc1, kFPReg);
99 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
100 newLIR2(cUnit, kX86XorpsRR, rlResult.lowReg, rlResult.lowReg);
101 newLIR2(cUnit, kX86SubsdRR, rlResult.lowReg, rlSrc1.lowReg);
102 storeValueWide(cUnit, rlDest, rlResult);
103 return false;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800104 case Instruction::REM_DOUBLE_2ADDR:
105 case Instruction::REM_DOUBLE: {
buzbee408ad162012-06-06 16:45:18 -0700106 return genArithOpDoublePortable(cUnit, opcode, rlDest, rlSrc1, rlSrc2);
buzbeee88dfbf2012-03-05 11:19:57 -0800107 }
Ian Rogersb5d09b22012-03-06 22:14:17 -0800108 default:
109 return true;
110 }
111 rlSrc1 = loadValueWide(cUnit, rlSrc1, kFPReg);
112 DCHECK(rlSrc1.wide);
113 rlSrc2 = loadValueWide(cUnit, rlSrc2, kFPReg);
114 DCHECK(rlSrc2.wide);
115 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
116 DCHECK(rlDest.wide);
117 DCHECK(rlResult.wide);
118 int rDest = S2D(rlResult.lowReg, rlResult.highReg);
119 int rSrc1 = S2D(rlSrc1.lowReg, rlSrc1.highReg);
120 int rSrc2 = S2D(rlSrc2.lowReg, rlSrc2.highReg);
121 // TODO: at least CHECK_NE(rDest, rSrc2);
122 opRegCopy(cUnit, rDest, rSrc1);
123 newLIR2(cUnit, op, rDest, rSrc2);
124 storeValueWide(cUnit, rlDest, rlResult);
125 return false;
buzbeee88dfbf2012-03-05 11:19:57 -0800126}
127
buzbee408ad162012-06-06 16:45:18 -0700128static bool genConversion(CompilationUnit *cUnit, Instruction::Code opcode,
129 RegLocation rlDest, RegLocation rlSrc) {
jeffhao5121e0b2012-05-08 18:23:38 -0700130 RegisterClass rcSrc = kFPReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800131 X86OpCode op = kX86Nop;
132 int srcReg;
133 RegLocation rlResult;
134 switch (opcode) {
135 case Instruction::INT_TO_FLOAT:
jeffhao5121e0b2012-05-08 18:23:38 -0700136 rcSrc = kCoreReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800137 op = kX86Cvtsi2ssRR;
138 break;
139 case Instruction::DOUBLE_TO_FLOAT:
jeffhao5121e0b2012-05-08 18:23:38 -0700140 rcSrc = kFPReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800141 op = kX86Cvtsd2ssRR;
142 break;
143 case Instruction::FLOAT_TO_DOUBLE:
jeffhao5121e0b2012-05-08 18:23:38 -0700144 rcSrc = kFPReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800145 op = kX86Cvtss2sdRR;
146 break;
147 case Instruction::INT_TO_DOUBLE:
jeffhao5121e0b2012-05-08 18:23:38 -0700148 rcSrc = kCoreReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800149 op = kX86Cvtsi2sdRR;
150 break;
jeffhao292188d2012-05-17 15:45:04 -0700151 case Instruction::FLOAT_TO_INT: {
jeffhao41005dd2012-05-09 17:58:52 -0700152 rlSrc = loadValue(cUnit, rlSrc, kFPReg);
153 srcReg = rlSrc.lowReg;
jeffhao41005dd2012-05-09 17:58:52 -0700154 oatClobberSReg(cUnit, rlDest.sRegLow);
155 rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
jeffhao292188d2012-05-17 15:45:04 -0700156 int tempReg = oatAllocTempFloat(cUnit);
jeffhao41005dd2012-05-09 17:58:52 -0700157
158 loadConstant(cUnit, rlResult.lowReg, 0x7fffffff);
159 newLIR2(cUnit, kX86Cvtsi2ssRR, tempReg, rlResult.lowReg);
160 newLIR2(cUnit, kX86ComissRR, srcReg, tempReg);
jeffhao292188d2012-05-17 15:45:04 -0700161 LIR* branchPosOverflow = newLIR2(cUnit, kX86Jcc8, 0, kX86CondA);
162 LIR* branchNaN = newLIR2(cUnit, kX86Jcc8, 0, kX86CondP);
163 newLIR2(cUnit, kX86Cvttss2siRR, rlResult.lowReg, srcReg);
164 LIR* branchNormal = newLIR1(cUnit, kX86Jmp8, 0);
165 branchNaN->target = newLIR0(cUnit, kPseudoTargetLabel);
166 newLIR2(cUnit, kX86Xor32RR, rlResult.lowReg, rlResult.lowReg);
167 branchPosOverflow->target = newLIR0(cUnit, kPseudoTargetLabel);
168 branchNormal->target = newLIR0(cUnit, kPseudoTargetLabel);
jeffhao41005dd2012-05-09 17:58:52 -0700169 storeValue(cUnit, rlDest, rlResult);
170 return false;
jeffhao292188d2012-05-17 15:45:04 -0700171 }
172 case Instruction::DOUBLE_TO_INT: {
jeffhao41005dd2012-05-09 17:58:52 -0700173 rlSrc = loadValueWide(cUnit, rlSrc, kFPReg);
174 srcReg = rlSrc.lowReg;
jeffhao41005dd2012-05-09 17:58:52 -0700175 oatClobberSReg(cUnit, rlDest.sRegLow);
176 rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
jeffhao292188d2012-05-17 15:45:04 -0700177 int tempReg = oatAllocTempDouble(cUnit);
jeffhao41005dd2012-05-09 17:58:52 -0700178
179 loadConstant(cUnit, rlResult.lowReg, 0x7fffffff);
180 newLIR2(cUnit, kX86Cvtsi2sdRR, tempReg, rlResult.lowReg);
181 newLIR2(cUnit, kX86ComisdRR, srcReg, tempReg);
jeffhao292188d2012-05-17 15:45:04 -0700182 LIR* branchPosOverflow = newLIR2(cUnit, kX86Jcc8, 0, kX86CondA);
183 LIR* branchNaN = newLIR2(cUnit, kX86Jcc8, 0, kX86CondP);
184 newLIR2(cUnit, kX86Cvttsd2siRR, rlResult.lowReg, srcReg);
185 LIR* branchNormal = newLIR1(cUnit, kX86Jmp8, 0);
186 branchNaN->target = newLIR0(cUnit, kPseudoTargetLabel);
187 newLIR2(cUnit, kX86Xor32RR, rlResult.lowReg, rlResult.lowReg);
188 branchPosOverflow->target = newLIR0(cUnit, kPseudoTargetLabel);
189 branchNormal->target = newLIR0(cUnit, kPseudoTargetLabel);
jeffhao41005dd2012-05-09 17:58:52 -0700190 storeValue(cUnit, rlDest, rlResult);
191 return false;
jeffhao292188d2012-05-17 15:45:04 -0700192 }
Ian Rogersb5d09b22012-03-06 22:14:17 -0800193 case Instruction::LONG_TO_DOUBLE:
Ian Rogersb5d09b22012-03-06 22:14:17 -0800194 case Instruction::LONG_TO_FLOAT:
jeffhao41005dd2012-05-09 17:58:52 -0700195 // These can be implemented inline by using memory as a 64-bit source.
196 // However, this can't be done easily if the register has been promoted.
197 UNIMPLEMENTED(WARNING) << "inline l2[df] " << PrettyMethod(cUnit->method_idx, *cUnit->dex_file);
198 case Instruction::FLOAT_TO_LONG:
Ian Rogersb5d09b22012-03-06 22:14:17 -0800199 case Instruction::DOUBLE_TO_LONG:
buzbee408ad162012-06-06 16:45:18 -0700200 return genConversionPortable(cUnit, opcode, rlDest, rlSrc);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800201 default:
202 return true;
203 }
buzbee408ad162012-06-06 16:45:18 -0700204 if (rlSrc.wide) {
jeffhao5121e0b2012-05-08 18:23:38 -0700205 rlSrc = loadValueWide(cUnit, rlSrc, rcSrc);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800206 srcReg = S2D(rlSrc.lowReg, rlSrc.highReg);
207 } else {
jeffhao5121e0b2012-05-08 18:23:38 -0700208 rlSrc = loadValue(cUnit, rlSrc, rcSrc);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800209 srcReg = rlSrc.lowReg;
210 }
buzbee408ad162012-06-06 16:45:18 -0700211 if (rlDest.wide) {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800212 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
213 newLIR2(cUnit, op, S2D(rlResult.lowReg, rlResult.highReg), srcReg);
214 storeValueWide(cUnit, rlDest, rlResult);
215 } else {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800216 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
217 newLIR2(cUnit, op, rlResult.lowReg, srcReg);
218 storeValue(cUnit, rlDest, rlResult);
219 }
220 return false;
buzbeee88dfbf2012-03-05 11:19:57 -0800221}
222
buzbee408ad162012-06-06 16:45:18 -0700223static bool genCmpFP(CompilationUnit *cUnit, Instruction::Code code, RegLocation rlDest,
Ian Rogersb5d09b22012-03-06 22:14:17 -0800224 RegLocation rlSrc1, RegLocation rlSrc2) {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800225 bool single = (code == Instruction::CMPL_FLOAT) || (code == Instruction::CMPG_FLOAT);
226 bool unorderedGt = (code == Instruction::CMPG_DOUBLE) || (code == Instruction::CMPG_FLOAT);
227 int srcReg1;
228 int srcReg2;
229 if (single) {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800230 rlSrc1 = loadValue(cUnit, rlSrc1, kFPReg);
231 srcReg1 = rlSrc1.lowReg;
jeffhao644d5312012-05-03 19:04:49 -0700232 rlSrc2 = loadValue(cUnit, rlSrc2, kFPReg);
233 srcReg2 = rlSrc2.lowReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800234 } else {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800235 rlSrc1 = loadValueWide(cUnit, rlSrc1, kFPReg);
236 srcReg1 = S2D(rlSrc1.lowReg, rlSrc1.highReg);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800237 rlSrc2 = loadValueWide(cUnit, rlSrc2, kFPReg);
238 srcReg2 = S2D(rlSrc2.lowReg, rlSrc2.highReg);
239 }
jeffhao41005dd2012-05-09 17:58:52 -0700240 oatClobberSReg(cUnit, rlDest.sRegLow);
Ian Rogersc6f3bb82012-03-21 20:40:33 -0700241 RegLocation rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
242 loadConstantNoClobber(cUnit, rlResult.lowReg, unorderedGt ? 1 : 0);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800243 if (single) {
244 newLIR2(cUnit, kX86UcomissRR, srcReg1, srcReg2);
245 } else {
246 newLIR2(cUnit, kX86UcomisdRR, srcReg1, srcReg2);
247 }
248 LIR* branch = NULL;
249 if (unorderedGt) {
Ian Rogersb41b33b2012-03-20 14:22:54 -0700250 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800251 }
252 newLIR2(cUnit, kX86Set8R, rlResult.lowReg, kX86CondA /* above - unsigned > */);
253 newLIR2(cUnit, kX86Sbb32RI, rlResult.lowReg, 0);
254 if (unorderedGt) {
255 branch->target = newLIR0(cUnit, kPseudoTargetLabel);
256 }
jeffhao644d5312012-05-03 19:04:49 -0700257 storeValue(cUnit, rlDest, rlResult);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800258 return false;
buzbeee88dfbf2012-03-05 11:19:57 -0800259}
260
261} // namespace art