blob: 9b0bdd8505ec229eee9c79f7a2fb8e2521465d3c [file] [log] [blame]
//===-- SystemZElimCompare.cpp - Eliminate comparison instructions --------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This pass:
// (1) tries to remove compares if CC already contains the required information
// (2) fuses compares and branches into COMPARE AND BRANCH instructions
//
//===----------------------------------------------------------------------===//
15
16#define DEBUG_TYPE "systemz-elim-compare"
17
18#include "SystemZTargetMachine.h"
19#include "llvm/ADT/Statistic.h"
20#include "llvm/CodeGen/MachineFunctionPass.h"
21#include "llvm/CodeGen/MachineInstrBuilder.h"
22#include "llvm/IR/Function.h"
23#include "llvm/Support/CommandLine.h"
24#include "llvm/Support/MathExtras.h"
25#include "llvm/Target/TargetInstrInfo.h"
26#include "llvm/Target/TargetMachine.h"
27#include "llvm/Target/TargetRegisterInfo.h"
28
29using namespace llvm;
30
31STATISTIC(EliminatedComparisons, "Number of eliminated comparisons");
32STATISTIC(FusedComparisons, "Number of fused compare-and-branch instructions");
33
34namespace {
35 class SystemZElimCompare : public MachineFunctionPass {
36 public:
37 static char ID;
38 SystemZElimCompare(const SystemZTargetMachine &tm)
39 : MachineFunctionPass(ID), TII(0), TRI(0) {}
40
41 virtual const char *getPassName() const {
42 return "SystemZ Comparison Elimination";
43 }
44
45 bool processBlock(MachineBasicBlock *MBB);
46 bool runOnMachineFunction(MachineFunction &F);
47
48 private:
49 bool adjustCCMasksForInstr(MachineInstr *MI, MachineInstr *Compare,
50 SmallVectorImpl<MachineInstr *> &CCUsers);
51 bool optimizeCompareZero(MachineInstr *Compare,
52 SmallVectorImpl<MachineInstr *> &CCUsers);
53 bool fuseCompareAndBranch(MachineInstr *Compare,
54 SmallVectorImpl<MachineInstr *> &CCUsers);
55
56 const SystemZInstrInfo *TII;
57 const TargetRegisterInfo *TRI;
58 };
59
60 char SystemZElimCompare::ID = 0;
61} // end of anonymous namespace
62
63FunctionPass *llvm::createSystemZElimComparePass(SystemZTargetMachine &TM) {
64 return new SystemZElimCompare(TM);
65}
66
67// Return true if CC is live out of MBB.
68static bool isCCLiveOut(MachineBasicBlock *MBB) {
69 for (MachineBasicBlock::succ_iterator SI = MBB->succ_begin(),
70 SE = MBB->succ_end(); SI != SE; ++SI)
71 if ((*SI)->isLiveIn(SystemZ::CC))
72 return true;
73 return false;
74}
75
76// Return true if any CC result of MI would reflect the value of subreg
77// SubReg of Reg.
78static bool resultTests(MachineInstr *MI, unsigned Reg, unsigned SubReg) {
79 if (MI->getNumOperands() > 0 &&
80 MI->getOperand(0).isReg() &&
81 MI->getOperand(0).isDef() &&
82 MI->getOperand(0).getReg() == Reg &&
83 MI->getOperand(0).getSubReg() == SubReg)
84 return true;
85
86 return false;
87}
88
89// The CC users in CCUsers are testing the result of a comparison of some
90// value X against zero and we know that any CC value produced by MI
91// would also reflect the value of X. Try to adjust CCUsers so that
92// they test the result of MI directly, returning true on success.
93// Leave everything unchanged on failure.
94bool SystemZElimCompare::
95adjustCCMasksForInstr(MachineInstr *MI, MachineInstr *Compare,
96 SmallVectorImpl<MachineInstr *> &CCUsers) {
97 int Opcode = MI->getOpcode();
98 const MCInstrDesc &Desc = TII->get(Opcode);
99 unsigned MIFlags = Desc.TSFlags;
100
101 // See which compare-style condition codes are available.
102 unsigned ReusableCCMask = 0;
103 if (MIFlags & SystemZII::CCHasZero)
104 ReusableCCMask |= SystemZ::CCMASK_CMP_EQ;
105
106 // For unsigned comparisons with zero, only equality makes sense.
107 unsigned CompareFlags = Compare->getDesc().TSFlags;
108 if (!(CompareFlags & SystemZII::IsLogical) &&
109 (MIFlags & SystemZII::CCHasOrder))
110 ReusableCCMask |= SystemZ::CCMASK_CMP_LT | SystemZ::CCMASK_CMP_GT;
111
112 if (ReusableCCMask == 0)
113 return false;
114
115 unsigned CCValues = SystemZII::getCCValues(MIFlags);
116 assert((ReusableCCMask & ~CCValues) == 0 && "Invalid CCValues");
117
118 // Now check whether these flags are enough for all users.
119 SmallVector<MachineOperand *, 4> AlterMasks;
120 for (unsigned int I = 0, E = CCUsers.size(); I != E; ++I) {
121 MachineInstr *MI = CCUsers[I];
122
123 // Fail if this isn't a use of CC that we understand.
124 unsigned Flags = MI->getDesc().TSFlags;
125 unsigned FirstOpNum;
126 if (Flags & SystemZII::CCMaskFirst)
127 FirstOpNum = 0;
128 else if (Flags & SystemZII::CCMaskLast)
129 FirstOpNum = MI->getNumExplicitOperands() - 2;
130 else
131 return false;
132
133 // Check whether the instruction predicate treats all CC values
134 // outside of ReusableCCMask in the same way. In that case it
135 // doesn't matter what those CC values mean.
136 unsigned CCValid = MI->getOperand(FirstOpNum).getImm();
137 unsigned CCMask = MI->getOperand(FirstOpNum + 1).getImm();
138 unsigned OutValid = ~ReusableCCMask & CCValid;
139 unsigned OutMask = ~ReusableCCMask & CCMask;
140 if (OutMask != 0 && OutMask != OutValid)
141 return false;
142
143 AlterMasks.push_back(&MI->getOperand(FirstOpNum));
144 AlterMasks.push_back(&MI->getOperand(FirstOpNum + 1));
145 }
146
147 // All users are OK. Adjust the masks for MI.
148 for (unsigned I = 0, E = AlterMasks.size(); I != E; I += 2) {
149 AlterMasks[I]->setImm(CCValues);
150 unsigned CCMask = AlterMasks[I + 1]->getImm();
151 if (CCMask & ~ReusableCCMask)
152 AlterMasks[I + 1]->setImm((CCMask & ReusableCCMask) |
153 (CCValues & ~ReusableCCMask));
154 }
155
156 // CC is now live after MI.
157 int CCDef = MI->findRegisterDefOperandIdx(SystemZ::CC, false, true, TRI);
158 assert(CCDef >= 0 && "Couldn't find CC set");
159 MI->getOperand(CCDef).setIsDead(false);
160
161 // Clear any intervening kills of CC.
162 MachineBasicBlock::iterator MBBI = MI, MBBE = Compare;
163 for (++MBBI; MBBI != MBBE; ++MBBI)
164 MBBI->clearRegisterKills(SystemZ::CC, TRI);
165
166 return true;
167}
168
169// Try to optimize cases where comparison instruction Compare is testing
170// a value against zero. Return true on success and if Compare should be
171// deleted as dead. CCUsers is the list of instructions that use the CC
172// value produced by Compare.
173bool SystemZElimCompare::
174optimizeCompareZero(MachineInstr *Compare,
175 SmallVectorImpl<MachineInstr *> &CCUsers) {
176 // Check whether this is a comparison against zero.
177 if (Compare->getNumExplicitOperands() != 2 ||
178 !Compare->getOperand(1).isImm() ||
179 Compare->getOperand(1).getImm() != 0)
180 return false;
181
182 // Search back for CC results that are based on the first operand.
183 unsigned SrcReg = Compare->getOperand(0).getReg();
184 unsigned SrcSubReg = Compare->getOperand(0).getSubReg();
185 MachineBasicBlock *MBB = Compare->getParent();
186 MachineBasicBlock::iterator MBBI = Compare, MBBE = MBB->begin();
187 while (MBBI != MBBE) {
188 --MBBI;
189 MachineInstr *MI = MBBI;
190 if (resultTests(MI, SrcReg, SrcSubReg) &&
191 adjustCCMasksForInstr(MI, Compare, CCUsers)) {
192 EliminatedComparisons += 1;
193 return true;
194 }
195 if (MI->modifiesRegister(SrcReg, TRI) ||
196 MI->modifiesRegister(SystemZ::CC, TRI))
197 return false;
198 }
199 return false;
200}
201
202// Try to fuse comparison instruction Compare into a later branch.
203// Return true on success and if Compare is therefore redundant.
204bool SystemZElimCompare::
205fuseCompareAndBranch(MachineInstr *Compare,
206 SmallVectorImpl<MachineInstr *> &CCUsers) {
207 // See whether we have a comparison that can be fused.
208 unsigned FusedOpcode = TII->getCompareAndBranch(Compare->getOpcode(),
209 Compare);
210 if (!FusedOpcode)
211 return false;
212
213 // See whether we have a single branch with which to fuse.
214 if (CCUsers.size() != 1)
215 return false;
216 MachineInstr *Branch = CCUsers[0];
217 if (Branch->getOpcode() != SystemZ::BRC)
218 return false;
219
220 // Make sure that the operands are available at the branch.
221 unsigned SrcReg = Compare->getOperand(0).getReg();
222 unsigned SrcReg2 = (Compare->getOperand(1).isReg() ?
223 Compare->getOperand(1).getReg() : 0);
224 MachineBasicBlock::iterator MBBI = Compare, MBBE = Branch;
225 for (++MBBI; MBBI != MBBE; ++MBBI)
226 if (MBBI->modifiesRegister(SrcReg, TRI) ||
227 (SrcReg2 && MBBI->modifiesRegister(SrcReg2, TRI)))
228 return false;
229
230 // Read the branch mask and target.
231 MachineOperand CCMask(MBBI->getOperand(1));
232 MachineOperand Target(MBBI->getOperand(2));
233 assert((CCMask.getImm() & ~SystemZ::CCMASK_ICMP) == 0 &&
234 "Invalid condition-code mask for integer comparison");
235
236 // Clear out all current operands.
237 int CCUse = MBBI->findRegisterUseOperandIdx(SystemZ::CC, false, TRI);
238 assert(CCUse >= 0 && "BRC must use CC");
239 Branch->RemoveOperand(CCUse);
240 Branch->RemoveOperand(2);
241 Branch->RemoveOperand(1);
242 Branch->RemoveOperand(0);
243
244 // Rebuild Branch as a fused compare and branch.
245 Branch->setDesc(TII->get(FusedOpcode));
246 MachineInstrBuilder(*Branch->getParent()->getParent(), Branch)
247 .addOperand(Compare->getOperand(0))
248 .addOperand(Compare->getOperand(1))
249 .addOperand(CCMask)
250 .addOperand(Target)
251 .addReg(SystemZ::CC, RegState::ImplicitDefine);
252
253 // Clear any intervening kills of SrcReg and SrcReg2.
254 MBBI = Compare;
255 for (++MBBI; MBBI != MBBE; ++MBBI) {
256 MBBI->clearRegisterKills(SrcReg, TRI);
257 if (SrcReg2)
258 MBBI->clearRegisterKills(SrcReg2, TRI);
259 }
260 FusedComparisons += 1;
261 return true;
262}
263
264// Process all comparison instructions in MBB. Return true if something
265// changed.
266bool SystemZElimCompare::processBlock(MachineBasicBlock *MBB) {
267 bool Changed = false;
268
269 // Walk backwards through the block looking for comparisons, recording
270 // all CC users as we go. The subroutines can delete Compare and
271 // instructions before it.
272 bool CompleteCCUsers = !isCCLiveOut(MBB);
273 SmallVector<MachineInstr *, 4> CCUsers;
274 MachineBasicBlock::iterator MBBI = MBB->end();
275 while (MBBI != MBB->begin()) {
276 MachineInstr *MI = --MBBI;
277 if (CompleteCCUsers &&
278 MI->isCompare() &&
279 (optimizeCompareZero(MI, CCUsers) ||
280 fuseCompareAndBranch(MI, CCUsers))) {
281 ++MBBI;
282 MI->removeFromParent();
283 Changed = true;
284 CCUsers.clear();
285 CompleteCCUsers = true;
286 continue;
287 }
288
289 if (MI->definesRegister(SystemZ::CC, TRI)) {
290 CCUsers.clear();
291 CompleteCCUsers = true;
292 } else if (MI->modifiesRegister(SystemZ::CC, TRI))
293 CompleteCCUsers = false;
294
295 if (CompleteCCUsers && MI->readsRegister(SystemZ::CC, TRI))
296 CCUsers.push_back(MI);
297 }
298 return Changed;
299}
300
301bool SystemZElimCompare::runOnMachineFunction(MachineFunction &F) {
302 TII = static_cast<const SystemZInstrInfo *>(F.getTarget().getInstrInfo());
303 TRI = &TII->getRegisterInfo();
304
305 bool Changed = false;
306 for (MachineFunction::iterator MFI = F.begin(), MFE = F.end();
307 MFI != MFE; ++MFI)
308 Changed |= processBlock(MFI);
309
310 return Changed;
311}