blob: e6b47d2a3754599e19e0dd09eb3feba4b8d9b1c8 [file] [log] [blame]
buzbeee88dfbf2012-03-05 11:19:57 -08001/*
2 * Copyright (C) 2012 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17namespace art {
18
Bill Buzbeea114add2012-05-03 15:00:40 -070019static bool genArithOpFloat(CompilationUnit *cUnit, MIR *mir,
20 RegLocation rlDest, RegLocation rlSrc1,
21 RegLocation rlSrc2) {
Ian Rogersb5d09b22012-03-06 22:14:17 -080022 X86OpCode op = kX86Nop;
23 RegLocation rlResult;
buzbeee88dfbf2012-03-05 11:19:57 -080024
Ian Rogersb5d09b22012-03-06 22:14:17 -080025 /*
26 * Don't attempt to optimize register usage since these opcodes call out to
27 * the handlers.
28 */
29 switch (mir->dalvikInsn.opcode) {
30 case Instruction::ADD_FLOAT_2ADDR:
31 case Instruction::ADD_FLOAT:
32 op = kX86AddssRR;
33 break;
34 case Instruction::SUB_FLOAT_2ADDR:
35 case Instruction::SUB_FLOAT:
36 op = kX86SubssRR;
37 break;
38 case Instruction::DIV_FLOAT_2ADDR:
39 case Instruction::DIV_FLOAT:
40 op = kX86DivssRR;
41 break;
42 case Instruction::MUL_FLOAT_2ADDR:
43 case Instruction::MUL_FLOAT:
44 op = kX86MulssRR;
45 break;
46 case Instruction::NEG_FLOAT:
jeffhao292188d2012-05-17 15:45:04 -070047 rlSrc1 = loadValue(cUnit, rlSrc1, kFPReg);
48 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
49 newLIR2(cUnit, kX86XorpsRR, rlResult.lowReg, rlResult.lowReg);
50 newLIR2(cUnit, kX86SubssRR, rlResult.lowReg, rlSrc1.lowReg);
51 storeValue(cUnit, rlDest, rlResult);
52 return false;
Ian Rogersb5d09b22012-03-06 22:14:17 -080053 case Instruction::REM_FLOAT_2ADDR:
54 case Instruction::REM_FLOAT: {
55 return genArithOpFloatPortable(cUnit, mir, rlDest, rlSrc1, rlSrc2);
buzbeee88dfbf2012-03-05 11:19:57 -080056 }
Ian Rogersb5d09b22012-03-06 22:14:17 -080057 default:
58 return true;
59 }
60 rlSrc1 = loadValue(cUnit, rlSrc1, kFPReg);
61 rlSrc2 = loadValue(cUnit, rlSrc2, kFPReg);
62 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
63 int rDest = rlResult.lowReg;
64 int rSrc1 = rlSrc1.lowReg;
65 int rSrc2 = rlSrc2.lowReg;
66 // TODO: at least CHECK_NE(rDest, rSrc2);
67 opRegCopy(cUnit, rDest, rSrc1);
68 newLIR2(cUnit, op, rDest, rSrc2);
69 storeValue(cUnit, rlDest, rlResult);
buzbeee88dfbf2012-03-05 11:19:57 -080070
Ian Rogersb5d09b22012-03-06 22:14:17 -080071 return false;
buzbeee88dfbf2012-03-05 11:19:57 -080072}
73
74static bool genArithOpDouble(CompilationUnit *cUnit, MIR *mir,
75 RegLocation rlDest, RegLocation rlSrc1,
Ian Rogersb5d09b22012-03-06 22:14:17 -080076 RegLocation rlSrc2) {
77 X86OpCode op = kX86Nop;
78 RegLocation rlResult;
buzbeee88dfbf2012-03-05 11:19:57 -080079
Ian Rogersb5d09b22012-03-06 22:14:17 -080080 switch (mir->dalvikInsn.opcode) {
81 case Instruction::ADD_DOUBLE_2ADDR:
82 case Instruction::ADD_DOUBLE:
83 op = kX86AddsdRR;
84 break;
85 case Instruction::SUB_DOUBLE_2ADDR:
86 case Instruction::SUB_DOUBLE:
87 op = kX86SubsdRR;
88 break;
89 case Instruction::DIV_DOUBLE_2ADDR:
90 case Instruction::DIV_DOUBLE:
91 op = kX86DivsdRR;
92 break;
93 case Instruction::MUL_DOUBLE_2ADDR:
94 case Instruction::MUL_DOUBLE:
95 op = kX86MulsdRR;
96 break;
97 case Instruction::NEG_DOUBLE:
jeffhao292188d2012-05-17 15:45:04 -070098 rlSrc1 = loadValueWide(cUnit, rlSrc1, kFPReg);
99 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
100 newLIR2(cUnit, kX86XorpsRR, rlResult.lowReg, rlResult.lowReg);
101 newLIR2(cUnit, kX86SubsdRR, rlResult.lowReg, rlSrc1.lowReg);
102 storeValueWide(cUnit, rlDest, rlResult);
103 return false;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800104 case Instruction::REM_DOUBLE_2ADDR:
105 case Instruction::REM_DOUBLE: {
106 return genArithOpDoublePortable(cUnit, mir, rlDest, rlSrc1, rlSrc2);
buzbeee88dfbf2012-03-05 11:19:57 -0800107 }
Ian Rogersb5d09b22012-03-06 22:14:17 -0800108 default:
109 return true;
110 }
111 rlSrc1 = loadValueWide(cUnit, rlSrc1, kFPReg);
112 DCHECK(rlSrc1.wide);
113 rlSrc2 = loadValueWide(cUnit, rlSrc2, kFPReg);
114 DCHECK(rlSrc2.wide);
115 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
116 DCHECK(rlDest.wide);
117 DCHECK(rlResult.wide);
118 int rDest = S2D(rlResult.lowReg, rlResult.highReg);
119 int rSrc1 = S2D(rlSrc1.lowReg, rlSrc1.highReg);
120 int rSrc2 = S2D(rlSrc2.lowReg, rlSrc2.highReg);
121 // TODO: at least CHECK_NE(rDest, rSrc2);
122 opRegCopy(cUnit, rDest, rSrc1);
123 newLIR2(cUnit, op, rDest, rSrc2);
124 storeValueWide(cUnit, rlDest, rlResult);
125 return false;
buzbeee88dfbf2012-03-05 11:19:57 -0800126}
127
Ian Rogersb5d09b22012-03-06 22:14:17 -0800128static bool genConversion(CompilationUnit *cUnit, MIR *mir) {
129 Instruction::Code opcode = mir->dalvikInsn.opcode;
130 bool longSrc = false;
131 bool longDest = false;
jeffhao5121e0b2012-05-08 18:23:38 -0700132 RegisterClass rcSrc = kFPReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800133 RegLocation rlSrc;
134 RegLocation rlDest;
135 X86OpCode op = kX86Nop;
136 int srcReg;
137 RegLocation rlResult;
138 switch (opcode) {
139 case Instruction::INT_TO_FLOAT:
140 longSrc = false;
141 longDest = false;
jeffhao5121e0b2012-05-08 18:23:38 -0700142 rcSrc = kCoreReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800143 op = kX86Cvtsi2ssRR;
144 break;
145 case Instruction::DOUBLE_TO_FLOAT:
146 longSrc = true;
147 longDest = false;
jeffhao5121e0b2012-05-08 18:23:38 -0700148 rcSrc = kFPReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800149 op = kX86Cvtsd2ssRR;
150 break;
151 case Instruction::FLOAT_TO_DOUBLE:
152 longSrc = false;
153 longDest = true;
jeffhao5121e0b2012-05-08 18:23:38 -0700154 rcSrc = kFPReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800155 op = kX86Cvtss2sdRR;
156 break;
157 case Instruction::INT_TO_DOUBLE:
158 longSrc = false;
159 longDest = true;
jeffhao5121e0b2012-05-08 18:23:38 -0700160 rcSrc = kCoreReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800161 op = kX86Cvtsi2sdRR;
162 break;
jeffhao292188d2012-05-17 15:45:04 -0700163 case Instruction::FLOAT_TO_INT: {
jeffhao41005dd2012-05-09 17:58:52 -0700164 rlSrc = oatGetSrc(cUnit, mir, 0);
165 rlSrc = loadValue(cUnit, rlSrc, kFPReg);
166 srcReg = rlSrc.lowReg;
167 rlDest = oatGetDest(cUnit, mir, 0);
168 oatClobberSReg(cUnit, rlDest.sRegLow);
169 rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
jeffhao292188d2012-05-17 15:45:04 -0700170 int tempReg = oatAllocTempFloat(cUnit);
jeffhao41005dd2012-05-09 17:58:52 -0700171
172 loadConstant(cUnit, rlResult.lowReg, 0x7fffffff);
173 newLIR2(cUnit, kX86Cvtsi2ssRR, tempReg, rlResult.lowReg);
174 newLIR2(cUnit, kX86ComissRR, srcReg, tempReg);
jeffhao292188d2012-05-17 15:45:04 -0700175 LIR* branchPosOverflow = newLIR2(cUnit, kX86Jcc8, 0, kX86CondA);
176 LIR* branchNaN = newLIR2(cUnit, kX86Jcc8, 0, kX86CondP);
177 newLIR2(cUnit, kX86Cvttss2siRR, rlResult.lowReg, srcReg);
178 LIR* branchNormal = newLIR1(cUnit, kX86Jmp8, 0);
179 branchNaN->target = newLIR0(cUnit, kPseudoTargetLabel);
180 newLIR2(cUnit, kX86Xor32RR, rlResult.lowReg, rlResult.lowReg);
181 branchPosOverflow->target = newLIR0(cUnit, kPseudoTargetLabel);
182 branchNormal->target = newLIR0(cUnit, kPseudoTargetLabel);
jeffhao41005dd2012-05-09 17:58:52 -0700183 storeValue(cUnit, rlDest, rlResult);
184 return false;
jeffhao292188d2012-05-17 15:45:04 -0700185 }
186 case Instruction::DOUBLE_TO_INT: {
jeffhao41005dd2012-05-09 17:58:52 -0700187 rlSrc = oatGetSrcWide(cUnit, mir, 0, 1);
188 rlSrc = loadValueWide(cUnit, rlSrc, kFPReg);
189 srcReg = rlSrc.lowReg;
190 rlDest = oatGetDest(cUnit, mir, 0);
191 oatClobberSReg(cUnit, rlDest.sRegLow);
192 rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
jeffhao292188d2012-05-17 15:45:04 -0700193 int tempReg = oatAllocTempDouble(cUnit);
jeffhao41005dd2012-05-09 17:58:52 -0700194
195 loadConstant(cUnit, rlResult.lowReg, 0x7fffffff);
196 newLIR2(cUnit, kX86Cvtsi2sdRR, tempReg, rlResult.lowReg);
197 newLIR2(cUnit, kX86ComisdRR, srcReg, tempReg);
jeffhao292188d2012-05-17 15:45:04 -0700198 LIR* branchPosOverflow = newLIR2(cUnit, kX86Jcc8, 0, kX86CondA);
199 LIR* branchNaN = newLIR2(cUnit, kX86Jcc8, 0, kX86CondP);
200 newLIR2(cUnit, kX86Cvttsd2siRR, rlResult.lowReg, srcReg);
201 LIR* branchNormal = newLIR1(cUnit, kX86Jmp8, 0);
202 branchNaN->target = newLIR0(cUnit, kPseudoTargetLabel);
203 newLIR2(cUnit, kX86Xor32RR, rlResult.lowReg, rlResult.lowReg);
204 branchPosOverflow->target = newLIR0(cUnit, kPseudoTargetLabel);
205 branchNormal->target = newLIR0(cUnit, kPseudoTargetLabel);
jeffhao41005dd2012-05-09 17:58:52 -0700206 storeValue(cUnit, rlDest, rlResult);
207 return false;
jeffhao292188d2012-05-17 15:45:04 -0700208 }
Ian Rogersb5d09b22012-03-06 22:14:17 -0800209 case Instruction::LONG_TO_DOUBLE:
Ian Rogersb5d09b22012-03-06 22:14:17 -0800210 case Instruction::LONG_TO_FLOAT:
jeffhao41005dd2012-05-09 17:58:52 -0700211 // These can be implemented inline by using memory as a 64-bit source.
212 // However, this can't be done easily if the register has been promoted.
213 UNIMPLEMENTED(WARNING) << "inline l2[df] " << PrettyMethod(cUnit->method_idx, *cUnit->dex_file);
214 case Instruction::FLOAT_TO_LONG:
Ian Rogersb5d09b22012-03-06 22:14:17 -0800215 case Instruction::DOUBLE_TO_LONG:
216 return genConversionPortable(cUnit, mir);
217 default:
218 return true;
219 }
220 if (longSrc) {
221 rlSrc = oatGetSrcWide(cUnit, mir, 0, 1);
jeffhao5121e0b2012-05-08 18:23:38 -0700222 rlSrc = loadValueWide(cUnit, rlSrc, rcSrc);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800223 srcReg = S2D(rlSrc.lowReg, rlSrc.highReg);
224 } else {
225 rlSrc = oatGetSrc(cUnit, mir, 0);
jeffhao5121e0b2012-05-08 18:23:38 -0700226 rlSrc = loadValue(cUnit, rlSrc, rcSrc);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800227 srcReg = rlSrc.lowReg;
228 }
229 if (longDest) {
230 rlDest = oatGetDestWide(cUnit, mir, 0, 1);
231 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
232 newLIR2(cUnit, op, S2D(rlResult.lowReg, rlResult.highReg), srcReg);
233 storeValueWide(cUnit, rlDest, rlResult);
234 } else {
235 rlDest = oatGetDest(cUnit, mir, 0);
236 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
237 newLIR2(cUnit, op, rlResult.lowReg, srcReg);
238 storeValue(cUnit, rlDest, rlResult);
239 }
240 return false;
buzbeee88dfbf2012-03-05 11:19:57 -0800241}
242
243static bool genCmpFP(CompilationUnit *cUnit, MIR *mir, RegLocation rlDest,
Ian Rogersb5d09b22012-03-06 22:14:17 -0800244 RegLocation rlSrc1, RegLocation rlSrc2) {
245 Instruction::Code code = mir->dalvikInsn.opcode;
246 bool single = (code == Instruction::CMPL_FLOAT) || (code == Instruction::CMPG_FLOAT);
247 bool unorderedGt = (code == Instruction::CMPG_DOUBLE) || (code == Instruction::CMPG_FLOAT);
248 int srcReg1;
249 int srcReg2;
250 if (single) {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800251 rlSrc1 = loadValue(cUnit, rlSrc1, kFPReg);
252 srcReg1 = rlSrc1.lowReg;
jeffhao644d5312012-05-03 19:04:49 -0700253 rlSrc2 = loadValue(cUnit, rlSrc2, kFPReg);
254 srcReg2 = rlSrc2.lowReg;
Ian Rogersb5d09b22012-03-06 22:14:17 -0800255 } else {
Ian Rogersb5d09b22012-03-06 22:14:17 -0800256 rlSrc1 = loadValueWide(cUnit, rlSrc1, kFPReg);
257 srcReg1 = S2D(rlSrc1.lowReg, rlSrc1.highReg);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800258 rlSrc2 = loadValueWide(cUnit, rlSrc2, kFPReg);
259 srcReg2 = S2D(rlSrc2.lowReg, rlSrc2.highReg);
260 }
jeffhao41005dd2012-05-09 17:58:52 -0700261 oatClobberSReg(cUnit, rlDest.sRegLow);
Ian Rogersc6f3bb82012-03-21 20:40:33 -0700262 RegLocation rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
263 loadConstantNoClobber(cUnit, rlResult.lowReg, unorderedGt ? 1 : 0);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800264 if (single) {
265 newLIR2(cUnit, kX86UcomissRR, srcReg1, srcReg2);
266 } else {
267 newLIR2(cUnit, kX86UcomisdRR, srcReg1, srcReg2);
268 }
269 LIR* branch = NULL;
270 if (unorderedGt) {
Ian Rogersb41b33b2012-03-20 14:22:54 -0700271 branch = newLIR2(cUnit, kX86Jcc8, 0, kX86CondPE);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800272 }
273 newLIR2(cUnit, kX86Set8R, rlResult.lowReg, kX86CondA /* above - unsigned > */);
274 newLIR2(cUnit, kX86Sbb32RI, rlResult.lowReg, 0);
275 if (unorderedGt) {
276 branch->target = newLIR0(cUnit, kPseudoTargetLabel);
277 }
jeffhao644d5312012-05-03 19:04:49 -0700278 storeValue(cUnit, rlDest, rlResult);
Ian Rogersb5d09b22012-03-06 22:14:17 -0800279 return false;
buzbeee88dfbf2012-03-05 11:19:57 -0800280}
281
282} // namespace art