blob: 0f9de5b604ba588ccc3de01cf7f54a83f864bf50 [file] [log] [blame]
Matteo Franchin43ec8732014-03-31 15:00:14 +01001/*
2 * Copyright (C) 2011 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17#include "arm64_lir.h"
18#include "codegen_arm64.h"
19#include "dex/quick/mir_to_lir-inl.h"
20
21namespace art {
22
23void Arm64Mir2Lir::GenArithOpFloat(Instruction::Code opcode, RegLocation rl_dest,
Matteo Franchine45fb9e2014-05-06 10:10:30 +010024 RegLocation rl_src1, RegLocation rl_src2) {
25 int op = kA64Brk1d;
Matteo Franchin43ec8732014-03-31 15:00:14 +010026 RegLocation rl_result;
27
Matteo Franchin43ec8732014-03-31 15:00:14 +010028 switch (opcode) {
29 case Instruction::ADD_FLOAT_2ADDR:
30 case Instruction::ADD_FLOAT:
Matteo Franchine45fb9e2014-05-06 10:10:30 +010031 op = kA64Fadd3fff;
Matteo Franchin43ec8732014-03-31 15:00:14 +010032 break;
33 case Instruction::SUB_FLOAT_2ADDR:
34 case Instruction::SUB_FLOAT:
Matteo Franchine45fb9e2014-05-06 10:10:30 +010035 op = kA64Fsub3fff;
Matteo Franchin43ec8732014-03-31 15:00:14 +010036 break;
37 case Instruction::DIV_FLOAT_2ADDR:
38 case Instruction::DIV_FLOAT:
Matteo Franchine45fb9e2014-05-06 10:10:30 +010039 op = kA64Fdiv3fff;
Matteo Franchin43ec8732014-03-31 15:00:14 +010040 break;
41 case Instruction::MUL_FLOAT_2ADDR:
42 case Instruction::MUL_FLOAT:
Matteo Franchine45fb9e2014-05-06 10:10:30 +010043 op = kA64Fmul3fff;
Matteo Franchin43ec8732014-03-31 15:00:14 +010044 break;
45 case Instruction::REM_FLOAT_2ADDR:
46 case Instruction::REM_FLOAT:
47 FlushAllRegs(); // Send everything to home location
Andreas Gampe2f244e92014-05-08 03:35:25 -070048 CallRuntimeHelperRegLocationRegLocation(QUICK_ENTRYPOINT_OFFSET(8, pFmodf), rl_src1, rl_src2,
Matteo Franchin43ec8732014-03-31 15:00:14 +010049 false);
buzbeea0cd2d72014-06-01 09:33:49 -070050 rl_result = GetReturn(kFPReg);
Matteo Franchin43ec8732014-03-31 15:00:14 +010051 StoreValue(rl_dest, rl_result);
52 return;
53 case Instruction::NEG_FLOAT:
54 GenNegFloat(rl_dest, rl_src1);
55 return;
56 default:
57 LOG(FATAL) << "Unexpected opcode: " << opcode;
58 }
59 rl_src1 = LoadValue(rl_src1, kFPReg);
60 rl_src2 = LoadValue(rl_src2, kFPReg);
61 rl_result = EvalLoc(rl_dest, kFPReg, true);
62 NewLIR3(op, rl_result.reg.GetReg(), rl_src1.reg.GetReg(), rl_src2.reg.GetReg());
63 StoreValue(rl_dest, rl_result);
64}
65
66void Arm64Mir2Lir::GenArithOpDouble(Instruction::Code opcode,
Matteo Franchine45fb9e2014-05-06 10:10:30 +010067 RegLocation rl_dest, RegLocation rl_src1, RegLocation rl_src2) {
68 int op = kA64Brk1d;
Matteo Franchin43ec8732014-03-31 15:00:14 +010069 RegLocation rl_result;
70
71 switch (opcode) {
72 case Instruction::ADD_DOUBLE_2ADDR:
73 case Instruction::ADD_DOUBLE:
Matteo Franchine45fb9e2014-05-06 10:10:30 +010074 op = kA64Fadd3fff;
Matteo Franchin43ec8732014-03-31 15:00:14 +010075 break;
76 case Instruction::SUB_DOUBLE_2ADDR:
77 case Instruction::SUB_DOUBLE:
Matteo Franchine45fb9e2014-05-06 10:10:30 +010078 op = kA64Fsub3fff;
Matteo Franchin43ec8732014-03-31 15:00:14 +010079 break;
80 case Instruction::DIV_DOUBLE_2ADDR:
81 case Instruction::DIV_DOUBLE:
Matteo Franchine45fb9e2014-05-06 10:10:30 +010082 op = kA64Fdiv3fff;
Matteo Franchin43ec8732014-03-31 15:00:14 +010083 break;
84 case Instruction::MUL_DOUBLE_2ADDR:
85 case Instruction::MUL_DOUBLE:
Matteo Franchine45fb9e2014-05-06 10:10:30 +010086 op = kA64Fmul3fff;
Matteo Franchin43ec8732014-03-31 15:00:14 +010087 break;
88 case Instruction::REM_DOUBLE_2ADDR:
89 case Instruction::REM_DOUBLE:
90 FlushAllRegs(); // Send everything to home location
Zheng Xu2d41a652014-06-09 11:05:31 +080091 {
92 ThreadOffset<8> helper_offset = QUICK_ENTRYPOINT_OFFSET(8, pFmod);
93 RegStorage r_tgt = CallHelperSetup(helper_offset);
94 LoadValueDirectWideFixed(rl_src1, rs_d0);
95 LoadValueDirectWideFixed(rl_src2, rs_d1);
96 ClobberCallerSave();
97 CallHelper(r_tgt, helper_offset, false);
98 }
buzbeea0cd2d72014-06-01 09:33:49 -070099 rl_result = GetReturnWide(kFPReg);
Matteo Franchin43ec8732014-03-31 15:00:14 +0100100 StoreValueWide(rl_dest, rl_result);
101 return;
102 case Instruction::NEG_DOUBLE:
103 GenNegDouble(rl_dest, rl_src1);
104 return;
105 default:
106 LOG(FATAL) << "Unexpected opcode: " << opcode;
107 }
108
109 rl_src1 = LoadValueWide(rl_src1, kFPReg);
110 DCHECK(rl_src1.wide);
111 rl_src2 = LoadValueWide(rl_src2, kFPReg);
112 DCHECK(rl_src2.wide);
113 rl_result = EvalLoc(rl_dest, kFPReg, true);
114 DCHECK(rl_dest.wide);
115 DCHECK(rl_result.wide);
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100116 NewLIR3(FWIDE(op), rl_result.reg.GetReg(), rl_src1.reg.GetReg(), rl_src2.reg.GetReg());
Matteo Franchin43ec8732014-03-31 15:00:14 +0100117 StoreValueWide(rl_dest, rl_result);
118}
119
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100120void Arm64Mir2Lir::GenConversion(Instruction::Code opcode,
121 RegLocation rl_dest, RegLocation rl_src) {
122 int op = kA64Brk1d;
Matteo Franchin43ec8732014-03-31 15:00:14 +0100123 RegLocation rl_result;
Serban Constantinescu032d3772014-05-23 17:38:18 +0100124 RegisterClass src_reg_class = kInvalidRegClass;
125 RegisterClass dst_reg_class = kInvalidRegClass;
Matteo Franchin43ec8732014-03-31 15:00:14 +0100126
127 switch (opcode) {
128 case Instruction::INT_TO_FLOAT:
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100129 op = kA64Scvtf2fw;
Serban Constantinescu032d3772014-05-23 17:38:18 +0100130 src_reg_class = kCoreReg;
131 dst_reg_class = kFPReg;
Matteo Franchin43ec8732014-03-31 15:00:14 +0100132 break;
133 case Instruction::FLOAT_TO_INT:
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100134 op = kA64Fcvtzs2wf;
Serban Constantinescu032d3772014-05-23 17:38:18 +0100135 src_reg_class = kFPReg;
136 dst_reg_class = kCoreReg;
Matteo Franchin43ec8732014-03-31 15:00:14 +0100137 break;
138 case Instruction::DOUBLE_TO_FLOAT:
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100139 op = kA64Fcvt2sS;
Serban Constantinescu032d3772014-05-23 17:38:18 +0100140 src_reg_class = kFPReg;
141 dst_reg_class = kFPReg;
Matteo Franchin43ec8732014-03-31 15:00:14 +0100142 break;
143 case Instruction::FLOAT_TO_DOUBLE:
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100144 op = kA64Fcvt2Ss;
Serban Constantinescu032d3772014-05-23 17:38:18 +0100145 src_reg_class = kFPReg;
146 dst_reg_class = kFPReg;
Matteo Franchin43ec8732014-03-31 15:00:14 +0100147 break;
148 case Instruction::INT_TO_DOUBLE:
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100149 op = FWIDE(kA64Scvtf2fw);
Serban Constantinescu032d3772014-05-23 17:38:18 +0100150 src_reg_class = kCoreReg;
151 dst_reg_class = kFPReg;
Matteo Franchin43ec8732014-03-31 15:00:14 +0100152 break;
153 case Instruction::DOUBLE_TO_INT:
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100154 op = FWIDE(kA64Fcvtzs2wf);
Serban Constantinescu032d3772014-05-23 17:38:18 +0100155 src_reg_class = kFPReg;
156 dst_reg_class = kCoreReg;
Matteo Franchin43ec8732014-03-31 15:00:14 +0100157 break;
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100158 case Instruction::LONG_TO_DOUBLE:
159 op = FWIDE(kA64Scvtf2fx);
Serban Constantinescu032d3772014-05-23 17:38:18 +0100160 src_reg_class = kCoreReg;
161 dst_reg_class = kFPReg;
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100162 break;
Matteo Franchin43ec8732014-03-31 15:00:14 +0100163 case Instruction::FLOAT_TO_LONG:
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100164 op = kA64Fcvtzs2xf;
Serban Constantinescu032d3772014-05-23 17:38:18 +0100165 src_reg_class = kFPReg;
166 dst_reg_class = kCoreReg;
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100167 break;
168 case Instruction::LONG_TO_FLOAT:
169 op = kA64Scvtf2fx;
Serban Constantinescu032d3772014-05-23 17:38:18 +0100170 src_reg_class = kCoreReg;
171 dst_reg_class = kFPReg;
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100172 break;
Matteo Franchin43ec8732014-03-31 15:00:14 +0100173 case Instruction::DOUBLE_TO_LONG:
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100174 op = FWIDE(kA64Fcvtzs2xf);
Serban Constantinescu032d3772014-05-23 17:38:18 +0100175 src_reg_class = kFPReg;
176 dst_reg_class = kCoreReg;
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100177 break;
Matteo Franchin43ec8732014-03-31 15:00:14 +0100178 default:
179 LOG(FATAL) << "Unexpected opcode: " << opcode;
180 }
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100181
Serban Constantinescu032d3772014-05-23 17:38:18 +0100182 DCHECK_NE(src_reg_class, kInvalidRegClass);
183 DCHECK_NE(dst_reg_class, kInvalidRegClass);
184 DCHECK_NE(op, kA64Brk1d);
185
Matteo Franchin43ec8732014-03-31 15:00:14 +0100186 if (rl_src.wide) {
Serban Constantinescu032d3772014-05-23 17:38:18 +0100187 rl_src = LoadValueWide(rl_src, src_reg_class);
Matteo Franchin43ec8732014-03-31 15:00:14 +0100188 } else {
Serban Constantinescu032d3772014-05-23 17:38:18 +0100189 rl_src = LoadValue(rl_src, src_reg_class);
Matteo Franchin43ec8732014-03-31 15:00:14 +0100190 }
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100191
Serban Constantinescu032d3772014-05-23 17:38:18 +0100192 rl_result = EvalLoc(rl_dest, dst_reg_class, true);
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100193 NewLIR2(op, rl_result.reg.GetReg(), rl_src.reg.GetReg());
194
Matteo Franchin43ec8732014-03-31 15:00:14 +0100195 if (rl_dest.wide) {
Matteo Franchin43ec8732014-03-31 15:00:14 +0100196 StoreValueWide(rl_dest, rl_result);
197 } else {
Matteo Franchin43ec8732014-03-31 15:00:14 +0100198 StoreValue(rl_dest, rl_result);
199 }
200}
201
202void Arm64Mir2Lir::GenFusedFPCmpBranch(BasicBlock* bb, MIR* mir, bool gt_bias,
203 bool is_double) {
204 LIR* target = &block_label_list_[bb->taken];
205 RegLocation rl_src1;
206 RegLocation rl_src2;
207 if (is_double) {
208 rl_src1 = mir_graph_->GetSrcWide(mir, 0);
209 rl_src2 = mir_graph_->GetSrcWide(mir, 2);
210 rl_src1 = LoadValueWide(rl_src1, kFPReg);
211 rl_src2 = LoadValueWide(rl_src2, kFPReg);
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100212 NewLIR2(FWIDE(kA64Fcmp2ff), rl_src1.reg.GetReg(), rl_src2.reg.GetReg());
Matteo Franchin43ec8732014-03-31 15:00:14 +0100213 } else {
214 rl_src1 = mir_graph_->GetSrc(mir, 0);
215 rl_src2 = mir_graph_->GetSrc(mir, 1);
216 rl_src1 = LoadValue(rl_src1, kFPReg);
217 rl_src2 = LoadValue(rl_src2, kFPReg);
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100218 NewLIR2(kA64Fcmp2ff, rl_src1.reg.GetReg(), rl_src2.reg.GetReg());
Matteo Franchin43ec8732014-03-31 15:00:14 +0100219 }
Matteo Franchin43ec8732014-03-31 15:00:14 +0100220 ConditionCode ccode = mir->meta.ccode;
221 switch (ccode) {
222 case kCondEq:
223 case kCondNe:
224 break;
225 case kCondLt:
226 if (gt_bias) {
227 ccode = kCondMi;
228 }
229 break;
230 case kCondLe:
231 if (gt_bias) {
232 ccode = kCondLs;
233 }
234 break;
235 case kCondGt:
236 if (gt_bias) {
237 ccode = kCondHi;
238 }
239 break;
240 case kCondGe:
241 if (gt_bias) {
242 ccode = kCondUge;
243 }
244 break;
245 default:
246 LOG(FATAL) << "Unexpected ccode: " << ccode;
247 }
248 OpCondBranch(ccode, target);
249}
250
251
252void Arm64Mir2Lir::GenCmpFP(Instruction::Code opcode, RegLocation rl_dest,
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100253 RegLocation rl_src1, RegLocation rl_src2) {
Matteo Franchin43ec8732014-03-31 15:00:14 +0100254 bool is_double = false;
255 int default_result = -1;
256 RegLocation rl_result;
257
258 switch (opcode) {
259 case Instruction::CMPL_FLOAT:
260 is_double = false;
261 default_result = -1;
262 break;
263 case Instruction::CMPG_FLOAT:
264 is_double = false;
265 default_result = 1;
266 break;
267 case Instruction::CMPL_DOUBLE:
268 is_double = true;
269 default_result = -1;
270 break;
271 case Instruction::CMPG_DOUBLE:
272 is_double = true;
273 default_result = 1;
274 break;
275 default:
276 LOG(FATAL) << "Unexpected opcode: " << opcode;
277 }
278 if (is_double) {
279 rl_src1 = LoadValueWide(rl_src1, kFPReg);
280 rl_src2 = LoadValueWide(rl_src2, kFPReg);
281 // In case result vreg is also a src vreg, break association to avoid useless copy by EvalLoc()
282 ClobberSReg(rl_dest.s_reg_low);
283 rl_result = EvalLoc(rl_dest, kCoreReg, true);
284 LoadConstant(rl_result.reg, default_result);
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100285 NewLIR2(FWIDE(kA64Fcmp2ff), rl_src1.reg.GetReg(), rl_src2.reg.GetReg());
Matteo Franchin43ec8732014-03-31 15:00:14 +0100286 } else {
287 rl_src1 = LoadValue(rl_src1, kFPReg);
288 rl_src2 = LoadValue(rl_src2, kFPReg);
289 // In case result vreg is also a srcvreg, break association to avoid useless copy by EvalLoc()
290 ClobberSReg(rl_dest.s_reg_low);
291 rl_result = EvalLoc(rl_dest, kCoreReg, true);
292 LoadConstant(rl_result.reg, default_result);
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100293 NewLIR2(kA64Fcmp2ff, rl_src1.reg.GetReg(), rl_src2.reg.GetReg());
Matteo Franchin43ec8732014-03-31 15:00:14 +0100294 }
295 DCHECK(!rl_result.reg.IsFloat());
Matteo Franchin43ec8732014-03-31 15:00:14 +0100296
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100297 // TODO(Arm64): should we rather do this?
298 // csinc wD, wzr, wzr, eq
299 // csneg wD, wD, wD, le
300 // (which requires 2 instructions rather than 3)
Matteo Franchin43ec8732014-03-31 15:00:14 +0100301
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100302 // Rd = if cond then Rd else -Rd.
303 NewLIR4(kA64Csneg4rrrc, rl_result.reg.GetReg(), rl_result.reg.GetReg(),
304 rl_result.reg.GetReg(), (default_result == 1) ? kArmCondPl : kArmCondLe);
305 NewLIR4(kA64Csel4rrrc, rl_result.reg.GetReg(), rwzr, rl_result.reg.GetReg(),
306 kArmCondEq);
Matteo Franchin43ec8732014-03-31 15:00:14 +0100307 StoreValue(rl_dest, rl_result);
308}
309
310void Arm64Mir2Lir::GenNegFloat(RegLocation rl_dest, RegLocation rl_src) {
311 RegLocation rl_result;
312 rl_src = LoadValue(rl_src, kFPReg);
313 rl_result = EvalLoc(rl_dest, kFPReg, true);
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100314 NewLIR2(kA64Fneg2ff, rl_result.reg.GetReg(), rl_src.reg.GetReg());
Matteo Franchin43ec8732014-03-31 15:00:14 +0100315 StoreValue(rl_dest, rl_result);
316}
317
318void Arm64Mir2Lir::GenNegDouble(RegLocation rl_dest, RegLocation rl_src) {
319 RegLocation rl_result;
320 rl_src = LoadValueWide(rl_src, kFPReg);
321 rl_result = EvalLoc(rl_dest, kFPReg, true);
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100322 NewLIR2(FWIDE(kA64Fneg2ff), rl_result.reg.GetReg(), rl_src.reg.GetReg());
Matteo Franchin43ec8732014-03-31 15:00:14 +0100323 StoreValueWide(rl_dest, rl_result);
324}
325
326bool Arm64Mir2Lir::GenInlinedSqrt(CallInfo* info) {
Matteo Franchin43ec8732014-03-31 15:00:14 +0100327 RegLocation rl_src = info->args[0];
328 RegLocation rl_dest = InlineTargetWide(info); // double place for result
329 rl_src = LoadValueWide(rl_src, kFPReg);
330 RegLocation rl_result = EvalLoc(rl_dest, kFPReg, true);
Matteo Franchine45fb9e2014-05-06 10:10:30 +0100331 NewLIR2(FWIDE(kA64Fsqrt2ff), rl_result.reg.GetReg(), rl_src.reg.GetReg());
Matteo Franchin43ec8732014-03-31 15:00:14 +0100332 StoreValueWide(rl_dest, rl_result);
333 return true;
334}
335
Serban Constantinescu23abec92014-07-02 16:13:38 +0100336bool Arm64Mir2Lir::GenInlinedMinMaxFP(CallInfo* info, bool is_min, bool is_double) {
337 DCHECK_EQ(cu_->instruction_set, kArm64);
338 int op = (is_min) ? kA64Fmin3fff : kA64Fmax3fff;
339 ArmOpcode wide = (is_double) ? FWIDE(0) : FUNWIDE(0);
340 RegLocation rl_src1 = info->args[0];
341 RegLocation rl_src2 = (is_double) ? info->args[2] : info->args[1];
342 rl_src1 = (is_double) ? LoadValueWide(rl_src1, kFPReg) : LoadValue(rl_src1, kFPReg);
343 rl_src2 = (is_double) ? LoadValueWide(rl_src2, kFPReg) : LoadValue(rl_src2, kFPReg);
344 RegLocation rl_dest = (is_double) ? InlineTargetWide(info) : InlineTarget(info);
345 RegLocation rl_result = EvalLoc(rl_dest, kFPReg, true);
346 NewLIR3(op | wide, rl_result.reg.GetReg(), rl_src1.reg.GetReg(), rl_src2.reg.GetReg());
347 (is_double) ? StoreValueWide(rl_dest, rl_result) : StoreValue(rl_dest, rl_result);
348 return true;
349}
350
Matteo Franchin43ec8732014-03-31 15:00:14 +0100351} // namespace art