blob: f8dfe6d82c5100b4cc518224af47a811b3f273a6 [file] [log] [blame]
Chris Lattner36e646c2010-02-24 07:06:50 +00001//===- DAGISelMatcherOpt.cpp - Optimize a DAG Matcher ---------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file implements the DAG Matcher optimizer.
11//
12//===----------------------------------------------------------------------===//
13
Chris Lattnerddfd5ab2010-02-27 07:49:13 +000014#define DEBUG_TYPE "isel-opt"
Chris Lattner36e646c2010-02-24 07:06:50 +000015#include "DAGISelMatcher.h"
Chris Lattner5cc7a832010-02-28 20:49:53 +000016#include "CodeGenDAGPatterns.h"
Chris Lattnercd632fb2010-02-25 07:45:24 +000017#include "llvm/ADT/DenseMap.h"
Chris Lattnerddfd5ab2010-02-27 07:49:13 +000018#include "llvm/Support/Debug.h"
19#include "llvm/Support/raw_ostream.h"
Chris Lattnercd632fb2010-02-25 07:45:24 +000020#include <vector>
Chris Lattner36e646c2010-02-24 07:06:50 +000021using namespace llvm;
22
Chris Lattnerf4950d02010-02-27 06:22:57 +000023/// ContractNodes - Turn multiple matcher node patterns like 'MoveChild+Record'
24/// into single compound nodes like RecordChild.
Chris Lattner5cc7a832010-02-28 20:49:53 +000025static void ContractNodes(OwningPtr<Matcher> &MatcherPtr,
26 const CodeGenDAGPatterns &CGP) {
Chris Lattner3ee1bc42010-02-24 07:31:45 +000027 // If we reached the end of the chain, we're done.
Chris Lattner9a515172010-02-25 02:04:40 +000028 Matcher *N = MatcherPtr.get();
Chris Lattner3ee1bc42010-02-24 07:31:45 +000029 if (N == 0) return;
30
Chris Lattner42363662010-02-25 19:00:39 +000031 // If we have a scope node, walk down all of the children.
32 if (ScopeMatcher *Scope = dyn_cast<ScopeMatcher>(N)) {
33 for (unsigned i = 0, e = Scope->getNumChildren(); i != e; ++i) {
34 OwningPtr<Matcher> Child(Scope->takeChild(i));
Chris Lattner5cc7a832010-02-28 20:49:53 +000035 ContractNodes(Child, CGP);
Chris Lattner42363662010-02-25 19:00:39 +000036 Scope->resetChild(i, Child.take());
37 }
38 return;
39 }
Chris Lattner3ee1bc42010-02-24 07:31:45 +000040
Chris Lattner9feb1e32010-02-24 19:52:48 +000041 // If we found a movechild node with a node that comes in a 'foochild' form,
42 // transform it.
Chris Lattner9a515172010-02-25 02:04:40 +000043 if (MoveChildMatcher *MC = dyn_cast<MoveChildMatcher>(N)) {
44 Matcher *New = 0;
45 if (RecordMatcher *RM = dyn_cast<RecordMatcher>(MC->getNext()))
Chris Lattner5377f912010-03-01 02:24:17 +000046 New = new RecordChildMatcher(MC->getChildNo(), RM->getWhatFor(),
47 RM->getResultNo());
Chris Lattner3c664b32010-02-24 20:15:25 +000048
Chris Lattner9a515172010-02-25 02:04:40 +000049 if (CheckTypeMatcher *CT= dyn_cast<CheckTypeMatcher>(MC->getNext()))
50 New = new CheckChildTypeMatcher(MC->getChildNo(), CT->getType());
Chris Lattner3c664b32010-02-24 20:15:25 +000051
52 if (New) {
53 // Insert the new node.
Chris Lattnerac10e4f2010-02-25 01:56:48 +000054 New->setNext(MatcherPtr.take());
55 MatcherPtr.reset(New);
Chris Lattner3c664b32010-02-24 20:15:25 +000056 // Remove the old one.
57 MC->setNext(MC->getNext()->takeNext());
Chris Lattner5cc7a832010-02-28 20:49:53 +000058 return ContractNodes(MatcherPtr, CGP);
Chris Lattner9feb1e32010-02-24 19:52:48 +000059 }
Chris Lattner3ee1bc42010-02-24 07:31:45 +000060 }
Chris Lattner9feb1e32010-02-24 19:52:48 +000061
Chris Lattner7a1dab42010-02-28 02:31:26 +000062 // Zap movechild -> moveparent.
Chris Lattner9a515172010-02-25 02:04:40 +000063 if (MoveChildMatcher *MC = dyn_cast<MoveChildMatcher>(N))
64 if (MoveParentMatcher *MP =
65 dyn_cast<MoveParentMatcher>(MC->getNext())) {
Chris Lattnerac10e4f2010-02-25 01:56:48 +000066 MatcherPtr.reset(MP->takeNext());
Chris Lattner5cc7a832010-02-28 20:49:53 +000067 return ContractNodes(MatcherPtr, CGP);
Chris Lattner9feb1e32010-02-24 19:52:48 +000068 }
Chris Lattner1f5ca1e2010-02-28 23:00:47 +000069
70 // FIXME: Handle OPC_MarkFlagResults.
71
Chris Lattner7dae4af2010-02-28 20:55:18 +000072 // Turn EmitNode->CompleteMatch into MorphNodeTo if we can.
Chris Lattner7a1dab42010-02-28 02:31:26 +000073 if (EmitNodeMatcher *EN = dyn_cast<EmitNodeMatcher>(N))
Chris Lattner19a1fbe2010-02-28 02:41:25 +000074 if (CompleteMatchMatcher *CM =
75 dyn_cast<CompleteMatchMatcher>(EN->getNext())) {
Chris Lattner7dae4af2010-02-28 20:55:18 +000076 // We can only use MorphNodeTo if the result values match up.
Chris Lattner5cc7a832010-02-28 20:49:53 +000077 unsigned RootResultFirst = EN->getFirstResultSlot();
78 bool ResultsMatch = true;
79 for (unsigned i = 0, e = CM->getNumResults(); i != e; ++i)
80 if (CM->getResult(i) != RootResultFirst+i)
81 ResultsMatch = false;
82
83 // If the selected node defines a subset of the flag/chain results, we
Chris Lattner7dae4af2010-02-28 20:55:18 +000084 // can't use MorphNodeTo. For example, we can't use MorphNodeTo if the
Chris Lattner5cc7a832010-02-28 20:49:53 +000085 // matched pattern has a chain but the root node doesn't.
86 const PatternToMatch &Pattern = CM->getPattern();
87
88 if (!EN->hasChain() &&
89 Pattern.getSrcPattern()->NodeHasProperty(SDNPHasChain, CGP))
90 ResultsMatch = false;
91
92 // If the matched node has a flag and the output root doesn't, we can't
Chris Lattner7dae4af2010-02-28 20:55:18 +000093 // use MorphNodeTo.
Chris Lattner5cc7a832010-02-28 20:49:53 +000094 //
95 // NOTE: Strictly speaking, we don't have to check for the flag here
96 // because the code in the pattern generator doesn't handle it right. We
97 // do it anyway for thoroughness.
Chris Lattner414bac82010-02-28 21:53:42 +000098 if (!EN->hasOutFlag() &&
Chris Lattner5cc7a832010-02-28 20:49:53 +000099 Pattern.getSrcPattern()->NodeHasProperty(SDNPOutFlag, CGP))
100 ResultsMatch = false;
101
102
103 // If the root result node defines more results than the source root node
104 // *and* has a chain or flag input, then we can't match it because it
105 // would end up replacing the extra result with the chain/flag.
106#if 0
107 if ((EN->hasFlag() || EN->hasChain()) &&
108 EN->getNumNonChainFlagVTs() > ... need to get no results reliably ...)
109 ResultMatch = false;
110#endif
111
112 if (ResultsMatch) {
113 const SmallVectorImpl<MVT::SimpleValueType> &VTs = EN->getVTList();
114 const SmallVectorImpl<unsigned> &Operands = EN->getOperandList();
Chris Lattner7dae4af2010-02-28 20:55:18 +0000115 MatcherPtr.reset(new MorphNodeToMatcher(EN->getOpcodeName(),
Chris Lattner414bac82010-02-28 21:53:42 +0000116 VTs.data(), VTs.size(),
Chris Lattner7dae4af2010-02-28 20:55:18 +0000117 Operands.data(),Operands.size(),
Chris Lattner414bac82010-02-28 21:53:42 +0000118 EN->hasChain(), EN->hasInFlag(),
119 EN->hasOutFlag(),
Chris Lattner7dae4af2010-02-28 20:55:18 +0000120 EN->hasMemRefs(),
121 EN->getNumFixedArityOperands(),
122 Pattern));
Chris Lattner5cc7a832010-02-28 20:49:53 +0000123 return;
124 }
125
Chris Lattner7dae4af2010-02-28 20:55:18 +0000126 // FIXME2: Kill off all the SelectionDAG::MorphNodeTo and getMachineNode
127 // variants.
Chris Lattner7a1dab42010-02-28 02:31:26 +0000128 }
129
Chris Lattner5cc7a832010-02-28 20:49:53 +0000130 ContractNodes(N->getNextPtr(), CGP);
Chris Lattnere0b45db2010-03-01 02:15:34 +0000131
132
133 // If we have a CheckType/CheckChildType/Record node followed by a
134 // CheckOpcode, invert the two nodes. We prefer to do structural checks
135 // before type checks, as this opens opportunities for factoring on targets
136 // like X86 where many operations are valid on multiple types.
137 if ((isa<CheckTypeMatcher>(N) || isa<CheckChildTypeMatcher>(N) ||
138 isa<RecordMatcher>(N)) &&
139 isa<CheckOpcodeMatcher>(N->getNext())) {
140 // Unlink the two nodes from the list.
141 Matcher *CheckType = MatcherPtr.take();
142 Matcher *CheckOpcode = CheckType->takeNext();
143 Matcher *Tail = CheckOpcode->takeNext();
144
145 // Relink them.
146 MatcherPtr.reset(CheckOpcode);
147 CheckOpcode->setNext(CheckType);
148 CheckType->setNext(Tail);
149 return ContractNodes(MatcherPtr, CGP);
150 }
Chris Lattner3ee1bc42010-02-24 07:31:45 +0000151}
152
Chris Lattnerf4950d02010-02-27 06:22:57 +0000153/// SinkPatternPredicates - Pattern predicates can be checked at any level of
154/// the matching tree. The generator dumps them at the top level of the pattern
155/// though, which prevents factoring from being able to see past them. This
156/// optimization sinks them as far down into the pattern as possible.
157///
158/// Conceptually, we'd like to sink these predicates all the way to the last
159/// matcher predicate in the series. However, it turns out that some
160/// ComplexPatterns have side effects on the graph, so we really don't want to
161/// run a the complex pattern if the pattern predicate will fail. For this
162/// reason, we refuse to sink the pattern predicate past a ComplexPattern.
163///
164static void SinkPatternPredicates(OwningPtr<Matcher> &MatcherPtr) {
165 // Recursively scan for a PatternPredicate.
166 // If we reached the end of the chain, we're done.
167 Matcher *N = MatcherPtr.get();
168 if (N == 0) return;
169
170 // Walk down all members of a scope node.
171 if (ScopeMatcher *Scope = dyn_cast<ScopeMatcher>(N)) {
172 for (unsigned i = 0, e = Scope->getNumChildren(); i != e; ++i) {
173 OwningPtr<Matcher> Child(Scope->takeChild(i));
174 SinkPatternPredicates(Child);
175 Scope->resetChild(i, Child.take());
176 }
177 return;
178 }
179
180 // If this node isn't a CheckPatternPredicateMatcher we keep scanning until
181 // we find one.
182 CheckPatternPredicateMatcher *CPPM =dyn_cast<CheckPatternPredicateMatcher>(N);
183 if (CPPM == 0)
184 return SinkPatternPredicates(N->getNextPtr());
185
186 // Ok, we found one, lets try to sink it. Check if we can sink it past the
187 // next node in the chain. If not, we won't be able to change anything and
188 // might as well bail.
189 if (!CPPM->getNext()->isSafeToReorderWithPatternPredicate())
190 return;
191
192 // Okay, we know we can sink it past at least one node. Unlink it from the
193 // chain and scan for the new insertion point.
194 MatcherPtr.take(); // Don't delete CPPM.
195 MatcherPtr.reset(CPPM->takeNext());
196
197 N = MatcherPtr.get();
198 while (N->getNext()->isSafeToReorderWithPatternPredicate())
199 N = N->getNext();
200
201 // At this point, we want to insert CPPM after N.
202 CPPM->setNext(N->takeNext());
203 N->setNext(CPPM);
204}
205
206/// FactorNodes - Turn matches like this:
207/// Scope
208/// OPC_CheckType i32
209/// ABC
210/// OPC_CheckType i32
211/// XYZ
212/// into:
213/// OPC_CheckType i32
214/// Scope
215/// ABC
216/// XYZ
217///
Chris Lattner9a515172010-02-25 02:04:40 +0000218static void FactorNodes(OwningPtr<Matcher> &MatcherPtr) {
Chris Lattner0acf2ba2010-02-25 01:57:41 +0000219 // If we reached the end of the chain, we're done.
Chris Lattner9a515172010-02-25 02:04:40 +0000220 Matcher *N = MatcherPtr.get();
Chris Lattner0acf2ba2010-02-25 01:57:41 +0000221 if (N == 0) return;
222
223 // If this is not a push node, just scan for one.
Chris Lattner42363662010-02-25 19:00:39 +0000224 ScopeMatcher *Scope = dyn_cast<ScopeMatcher>(N);
225 if (Scope == 0)
Chris Lattner0acf2ba2010-02-25 01:57:41 +0000226 return FactorNodes(N->getNextPtr());
227
Chris Lattner42363662010-02-25 19:00:39 +0000228 // Okay, pull together the children of the scope node into a vector so we can
Chris Lattnercd632fb2010-02-25 07:45:24 +0000229 // inspect it more easily. While we're at it, bucket them up by the hash
230 // code of their first predicate.
Chris Lattner9a515172010-02-25 02:04:40 +0000231 SmallVector<Matcher*, 32> OptionsToMatch;
Chris Lattner0acf2ba2010-02-25 01:57:41 +0000232
Chris Lattner42363662010-02-25 19:00:39 +0000233 for (unsigned i = 0, e = Scope->getNumChildren(); i != e; ++i) {
Chris Lattnercd632fb2010-02-25 07:45:24 +0000234 // Factor the subexpression.
Chris Lattner42363662010-02-25 19:00:39 +0000235 OwningPtr<Matcher> Child(Scope->takeChild(i));
236 FactorNodes(Child);
237
Chris Lattner92a22462010-02-26 08:08:41 +0000238 if (Matcher *N = Child.take())
Chris Lattner42363662010-02-25 19:00:39 +0000239 OptionsToMatch.push_back(N);
Chris Lattnercd632fb2010-02-25 07:45:24 +0000240 }
Chris Lattner0acf2ba2010-02-25 01:57:41 +0000241
Chris Lattnercd632fb2010-02-25 07:45:24 +0000242 SmallVector<Matcher*, 32> NewOptionsToMatch;
243
Chris Lattner92a22462010-02-26 08:08:41 +0000244 // Loop over options to match, merging neighboring patterns with identical
245 // starting nodes into a shared matcher.
Chris Lattnerddfd5ab2010-02-27 07:49:13 +0000246 for (unsigned OptionIdx = 0, e = OptionsToMatch.size(); OptionIdx != e;) {
Chris Lattnercd632fb2010-02-25 07:45:24 +0000247 // Find the set of matchers that start with this node.
Chris Lattnerddfd5ab2010-02-27 07:49:13 +0000248 Matcher *Optn = OptionsToMatch[OptionIdx++];
249
250 if (OptionIdx == e) {
Chris Lattnercd632fb2010-02-25 07:45:24 +0000251 NewOptionsToMatch.push_back(Optn);
252 continue;
253 }
254
Chris Lattnerddfd5ab2010-02-27 07:49:13 +0000255 // See if the next option starts with the same matcher. If the two
256 // neighbors *do* start with the same matcher, we can factor the matcher out
257 // of at least these two patterns. See what the maximal set we can merge
258 // together is.
Chris Lattner92a22462010-02-26 08:08:41 +0000259 SmallVector<Matcher*, 8> EqualMatchers;
260 EqualMatchers.push_back(Optn);
Chris Lattner92a22462010-02-26 08:08:41 +0000261
Chris Lattnerddfd5ab2010-02-27 07:49:13 +0000262 // Factor all of the known-equal matchers after this one into the same
263 // group.
264 while (OptionIdx != e && OptionsToMatch[OptionIdx]->isEqual(Optn))
265 EqualMatchers.push_back(OptionsToMatch[OptionIdx++]);
266
267 // If we found a non-equal matcher, see if it is contradictory with the
268 // current node. If so, we know that the ordering relation between the
269 // current sets of nodes and this node don't matter. Look past it to see if
270 // we can merge anything else into this matching group.
271 unsigned Scan = OptionIdx;
272 while (1) {
273 while (Scan != e && Optn->isContradictory(OptionsToMatch[Scan]))
274 ++Scan;
275
276 // Ok, we found something that isn't known to be contradictory. If it is
277 // equal, we can merge it into the set of nodes to factor, if not, we have
278 // to cease factoring.
279 if (Scan == e || !Optn->isEqual(OptionsToMatch[Scan])) break;
280
281 // If is equal after all, add the option to EqualMatchers and remove it
282 // from OptionsToMatch.
283 EqualMatchers.push_back(OptionsToMatch[Scan]);
284 OptionsToMatch.erase(OptionsToMatch.begin()+Scan);
285 --e;
286 }
287
Chris Lattnere9f720b2010-02-27 21:48:43 +0000288 if (Scan != e &&
289 // Don't print it's obvious nothing extra could be merged anyway.
290 Scan+1 != e) {
Chris Lattner086af322010-02-27 08:11:15 +0000291 DEBUG(errs() << "Couldn't merge this:\n";
292 Optn->print(errs(), 4);
293 errs() << "into this:\n";
294 OptionsToMatch[Scan]->print(errs(), 4);
Chris Lattner53d3ec92010-02-27 08:13:23 +0000295 if (Scan+1 != e)
Chris Lattner086af322010-02-27 08:11:15 +0000296 OptionsToMatch[Scan+1]->printOne(errs());
Chris Lattner53d3ec92010-02-27 08:13:23 +0000297 if (Scan+2 < e)
Chris Lattner086af322010-02-27 08:11:15 +0000298 OptionsToMatch[Scan+2]->printOne(errs());
Chris Lattnerddfd5ab2010-02-27 07:49:13 +0000299 errs() << "\n");
300 }
301
302 // If we only found one option starting with this matcher, no factoring is
303 // possible.
304 if (EqualMatchers.size() == 1) {
305 NewOptionsToMatch.push_back(EqualMatchers[0]);
306 continue;
307 }
Chris Lattner92a22462010-02-26 08:08:41 +0000308
Chris Lattnercd632fb2010-02-25 07:45:24 +0000309 // Factor these checks by pulling the first node off each entry and
Chris Lattnerb0e68102010-02-26 07:36:37 +0000310 // discarding it. Take the first one off the first entry to reuse.
311 Matcher *Shared = Optn;
312 Optn = Optn->takeNext();
313 EqualMatchers[0] = Optn;
314
Chris Lattner92a22462010-02-26 08:08:41 +0000315 // Remove and delete the first node from the other matchers we're factoring.
316 for (unsigned i = 1, e = EqualMatchers.size(); i != e; ++i) {
317 Matcher *Tmp = EqualMatchers[i]->takeNext();
318 delete EqualMatchers[i];
319 EqualMatchers[i] = Tmp;
320 }
Chris Lattnercd632fb2010-02-25 07:45:24 +0000321
Chris Lattnerb0e68102010-02-26 07:36:37 +0000322 Shared->setNext(new ScopeMatcher(&EqualMatchers[0], EqualMatchers.size()));
323
324 // Recursively factor the newly created node.
325 FactorNodes(Shared->getNextPtr());
326
327 NewOptionsToMatch.push_back(Shared);
Chris Lattnercd632fb2010-02-25 07:45:24 +0000328 }
329
330 // Reassemble a new Scope node.
Chris Lattnerb0e68102010-02-26 07:36:37 +0000331 assert(!NewOptionsToMatch.empty() && "where'd all our children go?");
Chris Lattner5cc7a832010-02-28 20:49:53 +0000332 if (NewOptionsToMatch.empty())
333 MatcherPtr.reset(0);
Chris Lattnerb0e68102010-02-26 07:36:37 +0000334 if (NewOptionsToMatch.size() == 1)
335 MatcherPtr.reset(NewOptionsToMatch[0]);
336 else {
337 Scope->setNumChildren(NewOptionsToMatch.size());
338 for (unsigned i = 0, e = NewOptionsToMatch.size(); i != e; ++i)
339 Scope->resetChild(i, NewOptionsToMatch[i]);
340 }
Chris Lattner0acf2ba2010-02-25 01:57:41 +0000341}
342
Chris Lattner5cc7a832010-02-28 20:49:53 +0000343Matcher *llvm::OptimizeMatcher(Matcher *TheMatcher,
344 const CodeGenDAGPatterns &CGP) {
Chris Lattner9a515172010-02-25 02:04:40 +0000345 OwningPtr<Matcher> MatcherPtr(TheMatcher);
Chris Lattner5cc7a832010-02-28 20:49:53 +0000346 ContractNodes(MatcherPtr, CGP);
Chris Lattnerf4950d02010-02-27 06:22:57 +0000347 SinkPatternPredicates(MatcherPtr);
Chris Lattner0acf2ba2010-02-25 01:57:41 +0000348 FactorNodes(MatcherPtr);
Chris Lattner3ee1bc42010-02-24 07:31:45 +0000349 return MatcherPtr.take();
Chris Lattner36e646c2010-02-24 07:06:50 +0000350}