blob: 3b0d540db0fd2342a663a9a9b1a7383efe9f7bbe [file] [log] [blame]
buzbee67bf8852011-08-17 17:51:35 -07001/*
2 * Copyright (C) 2011 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
buzbee1bc37c62012-11-20 13:35:41 -080017#include "arm_lir.h"
18#include "../codegen_util.h"
19#include "../ralloc_util.h"
20
Elliott Hughes11d1b0c2012-01-23 16:57:47 -080021namespace art {
22
buzbee408ad162012-06-06 16:45:18 -070023bool genArithOpFloat(CompilationUnit* cUnit, Instruction::Code opcode, RegLocation rlDest,
buzbee31a4a6f2012-02-28 15:36:15 -080024 RegLocation rlSrc1, RegLocation rlSrc2)
buzbee67bf8852011-08-17 17:51:35 -070025{
Bill Buzbeea114add2012-05-03 15:00:40 -070026 int op = kThumbBkpt;
27 RegLocation rlResult;
buzbee67bf8852011-08-17 17:51:35 -070028
Bill Buzbeea114add2012-05-03 15:00:40 -070029 /*
30 * Don't attempt to optimize register usage since these opcodes call out to
31 * the handlers.
32 */
buzbee408ad162012-06-06 16:45:18 -070033 switch (opcode) {
Bill Buzbeea114add2012-05-03 15:00:40 -070034 case Instruction::ADD_FLOAT_2ADDR:
35 case Instruction::ADD_FLOAT:
36 op = kThumb2Vadds;
37 break;
38 case Instruction::SUB_FLOAT_2ADDR:
39 case Instruction::SUB_FLOAT:
40 op = kThumb2Vsubs;
41 break;
42 case Instruction::DIV_FLOAT_2ADDR:
43 case Instruction::DIV_FLOAT:
44 op = kThumb2Vdivs;
45 break;
46 case Instruction::MUL_FLOAT_2ADDR:
47 case Instruction::MUL_FLOAT:
48 op = kThumb2Vmuls;
49 break;
50 case Instruction::REM_FLOAT_2ADDR:
51 case Instruction::REM_FLOAT:
52 case Instruction::NEG_FLOAT: {
buzbee408ad162012-06-06 16:45:18 -070053 return genArithOpFloatPortable(cUnit, opcode, rlDest, rlSrc1, rlSrc2);
buzbee67bf8852011-08-17 17:51:35 -070054 }
Bill Buzbeea114add2012-05-03 15:00:40 -070055 default:
56 return true;
57 }
58 rlSrc1 = loadValue(cUnit, rlSrc1, kFPReg);
59 rlSrc2 = loadValue(cUnit, rlSrc2, kFPReg);
60 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
buzbeecbd6d442012-11-17 14:11:25 -080061 newLIR3(cUnit, op, rlResult.lowReg, rlSrc1.lowReg, rlSrc2.lowReg);
Bill Buzbeea114add2012-05-03 15:00:40 -070062 storeValue(cUnit, rlDest, rlResult);
63 return false;
buzbee67bf8852011-08-17 17:51:35 -070064}
65
buzbee408ad162012-06-06 16:45:18 -070066bool genArithOpDouble(CompilationUnit* cUnit, Instruction::Code opcode,
67 RegLocation rlDest, RegLocation rlSrc1, RegLocation rlSrc2)
buzbee67bf8852011-08-17 17:51:35 -070068{
Bill Buzbeea114add2012-05-03 15:00:40 -070069 int op = kThumbBkpt;
70 RegLocation rlResult;
buzbee67bf8852011-08-17 17:51:35 -070071
buzbee408ad162012-06-06 16:45:18 -070072 switch (opcode) {
Bill Buzbeea114add2012-05-03 15:00:40 -070073 case Instruction::ADD_DOUBLE_2ADDR:
74 case Instruction::ADD_DOUBLE:
75 op = kThumb2Vaddd;
76 break;
77 case Instruction::SUB_DOUBLE_2ADDR:
78 case Instruction::SUB_DOUBLE:
79 op = kThumb2Vsubd;
80 break;
81 case Instruction::DIV_DOUBLE_2ADDR:
82 case Instruction::DIV_DOUBLE:
83 op = kThumb2Vdivd;
84 break;
85 case Instruction::MUL_DOUBLE_2ADDR:
86 case Instruction::MUL_DOUBLE:
87 op = kThumb2Vmuld;
88 break;
89 case Instruction::REM_DOUBLE_2ADDR:
90 case Instruction::REM_DOUBLE:
91 case Instruction::NEG_DOUBLE: {
buzbee408ad162012-06-06 16:45:18 -070092 return genArithOpDoublePortable(cUnit, opcode, rlDest, rlSrc1, rlSrc2);
buzbee67bf8852011-08-17 17:51:35 -070093 }
Bill Buzbeea114add2012-05-03 15:00:40 -070094 default:
95 return true;
96 }
buzbee67bf8852011-08-17 17:51:35 -070097
Bill Buzbeea114add2012-05-03 15:00:40 -070098 rlSrc1 = loadValueWide(cUnit, rlSrc1, kFPReg);
99 DCHECK(rlSrc1.wide);
100 rlSrc2 = loadValueWide(cUnit, rlSrc2, kFPReg);
101 DCHECK(rlSrc2.wide);
102 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
103 DCHECK(rlDest.wide);
104 DCHECK(rlResult.wide);
buzbeecbd6d442012-11-17 14:11:25 -0800105 newLIR3(cUnit, op, s2d(rlResult.lowReg, rlResult.highReg), s2d(rlSrc1.lowReg, rlSrc1.highReg),
buzbeef0504cd2012-11-13 16:31:10 -0800106 s2d(rlSrc2.lowReg, rlSrc2.highReg));
Bill Buzbeea114add2012-05-03 15:00:40 -0700107 storeValueWide(cUnit, rlDest, rlResult);
108 return false;
buzbee67bf8852011-08-17 17:51:35 -0700109}
110
buzbee408ad162012-06-06 16:45:18 -0700111bool genConversion(CompilationUnit* cUnit, Instruction::Code opcode,
112 RegLocation rlDest, RegLocation rlSrc)
buzbee67bf8852011-08-17 17:51:35 -0700113{
Bill Buzbeea114add2012-05-03 15:00:40 -0700114 int op = kThumbBkpt;
Bill Buzbeea114add2012-05-03 15:00:40 -0700115 int srcReg;
Bill Buzbeea114add2012-05-03 15:00:40 -0700116 RegLocation rlResult;
buzbee67bf8852011-08-17 17:51:35 -0700117
Bill Buzbeea114add2012-05-03 15:00:40 -0700118 switch (opcode) {
119 case Instruction::INT_TO_FLOAT:
Bill Buzbeea114add2012-05-03 15:00:40 -0700120 op = kThumb2VcvtIF;
121 break;
122 case Instruction::FLOAT_TO_INT:
Bill Buzbeea114add2012-05-03 15:00:40 -0700123 op = kThumb2VcvtFI;
124 break;
125 case Instruction::DOUBLE_TO_FLOAT:
Bill Buzbeea114add2012-05-03 15:00:40 -0700126 op = kThumb2VcvtDF;
127 break;
128 case Instruction::FLOAT_TO_DOUBLE:
Bill Buzbeea114add2012-05-03 15:00:40 -0700129 op = kThumb2VcvtFd;
130 break;
131 case Instruction::INT_TO_DOUBLE:
Bill Buzbeea114add2012-05-03 15:00:40 -0700132 op = kThumb2VcvtID;
133 break;
134 case Instruction::DOUBLE_TO_INT:
Bill Buzbeea114add2012-05-03 15:00:40 -0700135 op = kThumb2VcvtDI;
136 break;
137 case Instruction::LONG_TO_DOUBLE:
138 case Instruction::FLOAT_TO_LONG:
139 case Instruction::LONG_TO_FLOAT:
140 case Instruction::DOUBLE_TO_LONG:
buzbee408ad162012-06-06 16:45:18 -0700141 return genConversionPortable(cUnit, opcode, rlDest, rlSrc);
Bill Buzbeea114add2012-05-03 15:00:40 -0700142 default:
143 return true;
144 }
buzbee408ad162012-06-06 16:45:18 -0700145 if (rlSrc.wide) {
Bill Buzbeea114add2012-05-03 15:00:40 -0700146 rlSrc = loadValueWide(cUnit, rlSrc, kFPReg);
buzbeef0504cd2012-11-13 16:31:10 -0800147 srcReg = s2d(rlSrc.lowReg, rlSrc.highReg);
Bill Buzbeea114add2012-05-03 15:00:40 -0700148 } else {
Bill Buzbeea114add2012-05-03 15:00:40 -0700149 rlSrc = loadValue(cUnit, rlSrc, kFPReg);
150 srcReg = rlSrc.lowReg;
151 }
buzbee408ad162012-06-06 16:45:18 -0700152 if (rlDest.wide) {
Bill Buzbeea114add2012-05-03 15:00:40 -0700153 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
buzbeecbd6d442012-11-17 14:11:25 -0800154 newLIR2(cUnit, op, s2d(rlResult.lowReg, rlResult.highReg), srcReg);
Bill Buzbeea114add2012-05-03 15:00:40 -0700155 storeValueWide(cUnit, rlDest, rlResult);
156 } else {
Bill Buzbeea114add2012-05-03 15:00:40 -0700157 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
buzbeecbd6d442012-11-17 14:11:25 -0800158 newLIR2(cUnit, op, rlResult.lowReg, srcReg);
Bill Buzbeea114add2012-05-03 15:00:40 -0700159 storeValue(cUnit, rlDest, rlResult);
160 }
161 return false;
buzbee67bf8852011-08-17 17:51:35 -0700162}
163
buzbee84fd6932012-03-29 16:44:16 -0700164void genFusedFPCmpBranch(CompilationUnit* cUnit, BasicBlock* bb, MIR* mir,
165 bool gtBias, bool isDouble)
166{
buzbeea1da8a52012-07-09 14:00:21 -0700167 LIR* labelList = cUnit->blockLabelList;
Bill Buzbeea114add2012-05-03 15:00:40 -0700168 LIR* target = &labelList[bb->taken->id];
169 RegLocation rlSrc1;
170 RegLocation rlSrc2;
171 if (isDouble) {
buzbee15bf9802012-06-12 17:49:27 -0700172 rlSrc1 = oatGetSrcWide(cUnit, mir, 0);
173 rlSrc2 = oatGetSrcWide(cUnit, mir, 2);
Bill Buzbeea114add2012-05-03 15:00:40 -0700174 rlSrc1 = loadValueWide(cUnit, rlSrc1, kFPReg);
175 rlSrc2 = loadValueWide(cUnit, rlSrc2, kFPReg);
buzbeef0504cd2012-11-13 16:31:10 -0800176 newLIR2(cUnit, kThumb2Vcmpd, s2d(rlSrc1.lowReg, rlSrc2.highReg),
177 s2d(rlSrc2.lowReg, rlSrc2.highReg));
Bill Buzbeea114add2012-05-03 15:00:40 -0700178 } else {
179 rlSrc1 = oatGetSrc(cUnit, mir, 0);
180 rlSrc2 = oatGetSrc(cUnit, mir, 1);
181 rlSrc1 = loadValue(cUnit, rlSrc1, kFPReg);
182 rlSrc2 = loadValue(cUnit, rlSrc2, kFPReg);
183 newLIR2(cUnit, kThumb2Vcmps, rlSrc1.lowReg, rlSrc2.lowReg);
184 }
185 newLIR0(cUnit, kThumb2Fmstat);
186 ConditionCode ccode = static_cast<ConditionCode>(mir->dalvikInsn.arg[0]);
187 switch(ccode) {
188 case kCondEq:
189 case kCondNe:
190 break;
191 case kCondLt:
192 if (gtBias) {
193 ccode = kCondMi;
194 }
195 break;
196 case kCondLe:
197 if (gtBias) {
198 ccode = kCondLs;
199 }
200 break;
201 case kCondGt:
202 if (gtBias) {
203 ccode = kCondHi;
204 }
205 break;
206 case kCondGe:
207 if (gtBias) {
208 ccode = kCondCs;
209 }
210 break;
211 default:
buzbeecbd6d442012-11-17 14:11:25 -0800212 LOG(FATAL) << "Unexpected ccode: " << ccode;
Bill Buzbeea114add2012-05-03 15:00:40 -0700213 }
214 opCondBranch(cUnit, ccode, target);
buzbee84fd6932012-03-29 16:44:16 -0700215}
216
217
buzbee408ad162012-06-06 16:45:18 -0700218bool genCmpFP(CompilationUnit* cUnit, Instruction::Code opcode, RegLocation rlDest,
Bill Buzbeea114add2012-05-03 15:00:40 -0700219 RegLocation rlSrc1, RegLocation rlSrc2)
buzbee67bf8852011-08-17 17:51:35 -0700220{
Bill Buzbeea114add2012-05-03 15:00:40 -0700221 bool isDouble;
222 int defaultResult;
223 RegLocation rlResult;
buzbee67bf8852011-08-17 17:51:35 -0700224
buzbee408ad162012-06-06 16:45:18 -0700225 switch (opcode) {
Bill Buzbeea114add2012-05-03 15:00:40 -0700226 case Instruction::CMPL_FLOAT:
227 isDouble = false;
228 defaultResult = -1;
229 break;
230 case Instruction::CMPG_FLOAT:
231 isDouble = false;
232 defaultResult = 1;
233 break;
234 case Instruction::CMPL_DOUBLE:
235 isDouble = true;
236 defaultResult = -1;
237 break;
238 case Instruction::CMPG_DOUBLE:
239 isDouble = true;
240 defaultResult = 1;
241 break;
242 default:
243 return true;
244 }
245 if (isDouble) {
246 rlSrc1 = loadValueWide(cUnit, rlSrc1, kFPReg);
247 rlSrc2 = loadValueWide(cUnit, rlSrc2, kFPReg);
248 oatClobberSReg(cUnit, rlDest.sRegLow);
249 rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
250 loadConstant(cUnit, rlResult.lowReg, defaultResult);
buzbeef0504cd2012-11-13 16:31:10 -0800251 newLIR2(cUnit, kThumb2Vcmpd, s2d(rlSrc1.lowReg, rlSrc2.highReg),
252 s2d(rlSrc2.lowReg, rlSrc2.highReg));
Bill Buzbeea114add2012-05-03 15:00:40 -0700253 } else {
254 rlSrc1 = loadValue(cUnit, rlSrc1, kFPReg);
255 rlSrc2 = loadValue(cUnit, rlSrc2, kFPReg);
256 oatClobberSReg(cUnit, rlDest.sRegLow);
257 rlResult = oatEvalLoc(cUnit, rlDest, kCoreReg, true);
258 loadConstant(cUnit, rlResult.lowReg, defaultResult);
259 newLIR2(cUnit, kThumb2Vcmps, rlSrc1.lowReg, rlSrc2.lowReg);
260 }
buzbeef0504cd2012-11-13 16:31:10 -0800261 DCHECK(!ARM_FPREG(rlResult.lowReg));
Bill Buzbeea114add2012-05-03 15:00:40 -0700262 newLIR0(cUnit, kThumb2Fmstat);
buzbee67bf8852011-08-17 17:51:35 -0700263
Bill Buzbeea114add2012-05-03 15:00:40 -0700264 opIT(cUnit, (defaultResult == -1) ? kArmCondGt : kArmCondMi, "");
265 newLIR2(cUnit, kThumb2MovImmShift, rlResult.lowReg,
266 modifiedImmediate(-defaultResult)); // Must not alter ccodes
267 genBarrier(cUnit);
buzbee67bf8852011-08-17 17:51:35 -0700268
Bill Buzbeea114add2012-05-03 15:00:40 -0700269 opIT(cUnit, kArmCondEq, "");
270 loadConstant(cUnit, rlResult.lowReg, 0);
271 genBarrier(cUnit);
buzbee67bf8852011-08-17 17:51:35 -0700272
Bill Buzbeea114add2012-05-03 15:00:40 -0700273 storeValue(cUnit, rlDest, rlResult);
274 return false;
buzbee67bf8852011-08-17 17:51:35 -0700275}
Elliott Hughes11d1b0c2012-01-23 16:57:47 -0800276
buzbeeefc63692012-11-14 16:31:52 -0800277void genNegFloat(CompilationUnit* cUnit, RegLocation rlDest, RegLocation rlSrc)
278{
279 RegLocation rlResult;
280 rlSrc = loadValue(cUnit, rlSrc, kFPReg);
281 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
282 newLIR2(cUnit, kThumb2Vnegs, rlResult.lowReg, rlSrc.lowReg);
283 storeValue(cUnit, rlDest, rlResult);
284}
285
286void genNegDouble(CompilationUnit* cUnit, RegLocation rlDest, RegLocation rlSrc)
287{
288 RegLocation rlResult;
289 rlSrc = loadValueWide(cUnit, rlSrc, kFPReg);
290 rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
291 newLIR2(cUnit, kThumb2Vnegd, s2d(rlResult.lowReg, rlResult.highReg),
292 s2d(rlSrc.lowReg, rlSrc.highReg));
293 storeValueWide(cUnit, rlDest, rlResult);
294}
295
296bool genInlinedSqrt(CompilationUnit* cUnit, CallInfo* info) {
297 DCHECK_EQ(cUnit->instructionSet, kThumb2);
298 LIR *branch;
299 RegLocation rlSrc = info->args[0];
300 RegLocation rlDest = inlineTargetWide(cUnit, info); // double place for result
301 rlSrc = loadValueWide(cUnit, rlSrc, kFPReg);
302 RegLocation rlResult = oatEvalLoc(cUnit, rlDest, kFPReg, true);
303 newLIR2(cUnit, kThumb2Vsqrtd, s2d(rlResult.lowReg, rlResult.highReg),
304 s2d(rlSrc.lowReg, rlSrc.highReg));
305 newLIR2(cUnit, kThumb2Vcmpd, s2d(rlResult.lowReg, rlResult.highReg),
306 s2d(rlResult.lowReg, rlResult.highReg));
307 newLIR0(cUnit, kThumb2Fmstat);
308 branch = newLIR2(cUnit, kThumbBCond, 0, kArmCondEq);
309 oatClobberCalleeSave(cUnit);
310 oatLockCallTemps(cUnit); // Using fixed registers
311 int rTgt = loadHelper(cUnit, ENTRYPOINT_OFFSET(pSqrt));
312 newLIR3(cUnit, kThumb2Fmrrd, r0, r1, s2d(rlSrc.lowReg, rlSrc.highReg));
313 newLIR1(cUnit, kThumbBlxR, rTgt);
314 newLIR3(cUnit, kThumb2Fmdrr, s2d(rlResult.lowReg, rlResult.highReg), r0, r1);
315 branch->target = newLIR0(cUnit, kPseudoTargetLabel);
316 storeValueWide(cUnit, rlDest, rlResult);
317 return true;
318}
319
320
Elliott Hughes11d1b0c2012-01-23 16:57:47 -0800321} // namespace art