Eugene Zelenko | 76bf48d | 2017-06-26 22:44:03 +0000 | [diff] [blame] | 1 | //===- MacroFusion.cpp - Macro Fusion -------------------------------------===// |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 2 | // |
Chandler Carruth | 2946cd7 | 2019-01-19 08:50:56 +0000 | [diff] [blame] | 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | // |
| 9 | /// \file This file contains the implementation of the DAG scheduling mutation |
| 10 | /// to pair instructions back to back. |
| 11 | // |
| 12 | //===----------------------------------------------------------------------===// |
| 13 | |
| 14 | #include "llvm/CodeGen/MacroFusion.h" |
Eugene Zelenko | 76bf48d | 2017-06-26 22:44:03 +0000 | [diff] [blame] | 15 | #include "llvm/ADT/STLExtras.h" |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 16 | #include "llvm/ADT/Statistic.h" |
Eugene Zelenko | 76bf48d | 2017-06-26 22:44:03 +0000 | [diff] [blame] | 17 | #include "llvm/CodeGen/MachineInstr.h" |
| 18 | #include "llvm/CodeGen/MachineScheduler.h" |
| 19 | #include "llvm/CodeGen/ScheduleDAG.h" |
| 20 | #include "llvm/CodeGen/ScheduleDAGMutation.h" |
David Blaikie | 3f833ed | 2017-11-08 01:01:31 +0000 | [diff] [blame] | 21 | #include "llvm/CodeGen/TargetInstrInfo.h" |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 22 | #include "llvm/Support/CommandLine.h" |
Eugene Zelenko | 76bf48d | 2017-06-26 22:44:03 +0000 | [diff] [blame] | 23 | #include "llvm/Support/Debug.h" |
| 24 | #include "llvm/Support/raw_ostream.h" |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 25 | |
Evandro Menezes | 0cd23f56 | 2017-07-11 22:08:28 +0000 | [diff] [blame] | 26 | #define DEBUG_TYPE "machine-scheduler" |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 27 | |
| 28 | STATISTIC(NumFused, "Number of instr pairs fused"); |
| 29 | |
| 30 | using namespace llvm; |
| 31 | |
| 32 | static cl::opt<bool> EnableMacroFusion("misched-fusion", cl::Hidden, |
| 33 | cl::desc("Enable scheduling for macro fusion."), cl::init(true)); |
| 34 | |
Evandro Menezes | 54be62d | 2017-12-11 21:09:27 +0000 | [diff] [blame] | 35 | static bool isHazard(const SDep &Dep) { |
| 36 | return Dep.getKind() == SDep::Anti || Dep.getKind() == SDep::Output; |
| 37 | } |
| 38 | |
QingShan Zhang | d84b320 | 2019-12-04 04:58:34 +0000 | [diff] [blame] | 39 | static SUnit *getPredClusterSU(const SUnit &SU) { |
| 40 | for (const SDep &SI : SU.Preds) |
| 41 | if (SI.isCluster()) |
| 42 | return SI.getSUnit(); |
| 43 | |
| 44 | return nullptr; |
| 45 | } |
| 46 | |
| 47 | static bool hasLessThanNumFused(const SUnit &SU, unsigned FuseLimit) { |
| 48 | unsigned Num = 1; |
| 49 | const SUnit *CurrentSU = &SU; |
| 50 | while ((CurrentSU = getPredClusterSU(*CurrentSU)) && Num < FuseLimit) Num ++; |
| 51 | return Num < FuseLimit; |
| 52 | } |
| 53 | |
Clement Courbet | b70355f | 2019-03-29 08:33:05 +0000 | [diff] [blame] | 54 | static bool fuseInstructionPair(ScheduleDAGInstrs &DAG, SUnit &FirstSU, |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 55 | SUnit &SecondSU) { |
Evandro Menezes | 54be62d | 2017-12-11 21:09:27 +0000 | [diff] [blame] | 56 | // Check that neither instr is already paired with another along the edge |
| 57 | // between them. |
| 58 | for (SDep &SI : FirstSU.Succs) |
| 59 | if (SI.isCluster()) |
| 60 | return false; |
| 61 | |
| 62 | for (SDep &SI : SecondSU.Preds) |
| 63 | if (SI.isCluster()) |
| 64 | return false; |
| 65 | // Though the reachability checks above could be made more generic, |
Clement Courbet | b70355f | 2019-03-29 08:33:05 +0000 | [diff] [blame] | 66 | // perhaps as part of ScheduleDAGInstrs::addEdge(), since such edges are valid, |
Evandro Menezes | 54be62d | 2017-12-11 21:09:27 +0000 | [diff] [blame] | 67 | // the extra computation cost makes it less interesting in general cases. |
| 68 | |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 69 | // Create a single weak edge between the adjacent instrs. The only effect is |
| 70 | // to cause bottom-up scheduling to heavily prioritize the clustered instrs. |
Evandro Menezes | 54be62d | 2017-12-11 21:09:27 +0000 | [diff] [blame] | 71 | if (!DAG.addEdge(&SecondSU, SDep(&FirstSU, SDep::Cluster))) |
| 72 | return false; |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 73 | |
QingShan Zhang | 05b0c76 | 2019-12-10 03:10:21 +0000 | [diff] [blame] | 74 | // TODO - If we want to chain more than two instructions, we need to create |
| 75 | // artifical edges to make dependencies from the FirstSU also dependent |
| 76 | // on other chained instructions, and other chained instructions also |
| 77 | // dependent on the dependencies of the SecondSU, to prevent them from being |
| 78 | // scheduled into these chained instructions. |
| 79 | assert(hasLessThanNumFused(FirstSU, 2) && |
| 80 | "Currently we only support chaining together two instructions"); |
| 81 | |
Evandro Menezes | 54be62d | 2017-12-11 21:09:27 +0000 | [diff] [blame] | 82 | // Adjust the latency between both instrs. |
| 83 | for (SDep &SI : FirstSU.Succs) |
| 84 | if (SI.getSUnit() == &SecondSU) |
| 85 | SI.setLatency(0); |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 86 | |
Evandro Menezes | 54be62d | 2017-12-11 21:09:27 +0000 | [diff] [blame] | 87 | for (SDep &SI : SecondSU.Preds) |
| 88 | if (SI.getSUnit() == &FirstSU) |
| 89 | SI.setLatency(0); |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 90 | |
Nicola Zaghen | d34e60c | 2018-05-14 12:53:11 +0000 | [diff] [blame] | 91 | LLVM_DEBUG( |
Matthias Braun | 726e12c | 2018-09-19 00:23:35 +0000 | [diff] [blame] | 92 | dbgs() << "Macro fuse: "; DAG.dumpNodeName(FirstSU); dbgs() << " - "; |
| 93 | DAG.dumpNodeName(SecondSU); dbgs() << " / "; |
Nicola Zaghen | d34e60c | 2018-05-14 12:53:11 +0000 | [diff] [blame] | 94 | dbgs() << DAG.TII->getName(FirstSU.getInstr()->getOpcode()) << " - " |
| 95 | << DAG.TII->getName(SecondSU.getInstr()->getOpcode()) << '\n';); |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 96 | |
Evandro Menezes | 54be62d | 2017-12-11 21:09:27 +0000 | [diff] [blame] | 97 | // Make data dependencies from the FirstSU also dependent on the SecondSU to |
| 98 | // prevent them from being scheduled between the FirstSU and the SecondSU. |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 99 | if (&SecondSU != &DAG.ExitSU) |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 100 | for (const SDep &SI : FirstSU.Succs) { |
Evandro Menezes | 54be62d | 2017-12-11 21:09:27 +0000 | [diff] [blame] | 101 | SUnit *SU = SI.getSUnit(); |
| 102 | if (SI.isWeak() || isHazard(SI) || |
| 103 | SU == &DAG.ExitSU || SU == &SecondSU || SU->isPred(&SecondSU)) |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 104 | continue; |
Matthias Braun | 726e12c | 2018-09-19 00:23:35 +0000 | [diff] [blame] | 105 | LLVM_DEBUG(dbgs() << " Bind "; DAG.dumpNodeName(SecondSU); |
| 106 | dbgs() << " - "; DAG.dumpNodeName(*SU); dbgs() << '\n';); |
Evandro Menezes | 54be62d | 2017-12-11 21:09:27 +0000 | [diff] [blame] | 107 | DAG.addEdge(SU, SDep(&SecondSU, SDep::Artificial)); |
| 108 | } |
| 109 | |
| 110 | // Make the FirstSU also dependent on the dependencies of the SecondSU to |
| 111 | // prevent them from being scheduled between the FirstSU and the SecondSU. |
Matthias Braun | 09810c9 | 2018-07-26 17:43:56 +0000 | [diff] [blame] | 112 | if (&FirstSU != &DAG.EntrySU) { |
Evandro Menezes | 54be62d | 2017-12-11 21:09:27 +0000 | [diff] [blame] | 113 | for (const SDep &SI : SecondSU.Preds) { |
| 114 | SUnit *SU = SI.getSUnit(); |
| 115 | if (SI.isWeak() || isHazard(SI) || &FirstSU == SU || FirstSU.isSucc(SU)) |
| 116 | continue; |
Matthias Braun | 726e12c | 2018-09-19 00:23:35 +0000 | [diff] [blame] | 117 | LLVM_DEBUG(dbgs() << " Bind "; DAG.dumpNodeName(*SU); dbgs() << " - "; |
| 118 | DAG.dumpNodeName(FirstSU); dbgs() << '\n';); |
Evandro Menezes | 54be62d | 2017-12-11 21:09:27 +0000 | [diff] [blame] | 119 | DAG.addEdge(&FirstSU, SDep(SU, SDep::Artificial)); |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 120 | } |
Matthias Braun | 09810c9 | 2018-07-26 17:43:56 +0000 | [diff] [blame] | 121 | // ExitSU comes last by design, which acts like an implicit dependency |
| 122 | // between ExitSU and any bottom root in the graph. We should transfer |
| 123 | // this to FirstSU as well. |
| 124 | if (&SecondSU == &DAG.ExitSU) { |
| 125 | for (SUnit &SU : DAG.SUnits) { |
| 126 | if (SU.Succs.empty()) |
| 127 | DAG.addEdge(&FirstSU, SDep(&SU, SDep::Artificial)); |
| 128 | } |
| 129 | } |
| 130 | } |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 131 | |
| 132 | ++NumFused; |
Evandro Menezes | 54be62d | 2017-12-11 21:09:27 +0000 | [diff] [blame] | 133 | return true; |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 134 | } |
| 135 | |
Eugene Zelenko | 76bf48d | 2017-06-26 22:44:03 +0000 | [diff] [blame] | 136 | namespace { |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 137 | |
Adrian Prantl | 5f8f34e4 | 2018-05-01 15:54:18 +0000 | [diff] [blame] | 138 | /// Post-process the DAG to create cluster edges between instrs that may |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 139 | /// be fused by the processor into a single operation. |
| 140 | class MacroFusion : public ScheduleDAGMutation { |
| 141 | ShouldSchedulePredTy shouldScheduleAdjacent; |
| 142 | bool FuseBlock; |
Clement Courbet | b70355f | 2019-03-29 08:33:05 +0000 | [diff] [blame] | 143 | bool scheduleAdjacentImpl(ScheduleDAGInstrs &DAG, SUnit &AnchorSU); |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 144 | |
| 145 | public: |
| 146 | MacroFusion(ShouldSchedulePredTy shouldScheduleAdjacent, bool FuseBlock) |
| 147 | : shouldScheduleAdjacent(shouldScheduleAdjacent), FuseBlock(FuseBlock) {} |
| 148 | |
| 149 | void apply(ScheduleDAGInstrs *DAGInstrs) override; |
| 150 | }; |
| 151 | |
Eugene Zelenko | 76bf48d | 2017-06-26 22:44:03 +0000 | [diff] [blame] | 152 | } // end anonymous namespace |
| 153 | |
Clement Courbet | b70355f | 2019-03-29 08:33:05 +0000 | [diff] [blame] | 154 | void MacroFusion::apply(ScheduleDAGInstrs *DAG) { |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 155 | if (FuseBlock) |
| 156 | // For each of the SUnits in the scheduling block, try to fuse the instr in |
| 157 | // it with one in its predecessors. |
| 158 | for (SUnit &ISU : DAG->SUnits) |
| 159 | scheduleAdjacentImpl(*DAG, ISU); |
| 160 | |
| 161 | if (DAG->ExitSU.getInstr()) |
| 162 | // Try to fuse the instr in the ExitSU with one in its predecessors. |
| 163 | scheduleAdjacentImpl(*DAG, DAG->ExitSU); |
| 164 | } |
| 165 | |
Adrian Prantl | 5f8f34e4 | 2018-05-01 15:54:18 +0000 | [diff] [blame] | 166 | /// Implement the fusion of instr pairs in the scheduling DAG, |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 167 | /// anchored at the instr in AnchorSU.. |
Clement Courbet | b70355f | 2019-03-29 08:33:05 +0000 | [diff] [blame] | 168 | bool MacroFusion::scheduleAdjacentImpl(ScheduleDAGInstrs &DAG, SUnit &AnchorSU) { |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 169 | const MachineInstr &AnchorMI = *AnchorSU.getInstr(); |
| 170 | const TargetInstrInfo &TII = *DAG.TII; |
| 171 | const TargetSubtargetInfo &ST = DAG.MF.getSubtarget(); |
| 172 | |
| 173 | // Check if the anchor instr may be fused. |
| 174 | if (!shouldScheduleAdjacent(TII, ST, nullptr, AnchorMI)) |
| 175 | return false; |
| 176 | |
| 177 | // Explorer for fusion candidates among the dependencies of the anchor instr. |
| 178 | for (SDep &Dep : AnchorSU.Preds) { |
Evandro Menezes | 54be62d | 2017-12-11 21:09:27 +0000 | [diff] [blame] | 179 | // Ignore dependencies other than data or strong ordering. |
| 180 | if (Dep.isWeak() || isHazard(Dep)) |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 181 | continue; |
| 182 | |
| 183 | SUnit &DepSU = *Dep.getSUnit(); |
| 184 | if (DepSU.isBoundaryNode()) |
| 185 | continue; |
| 186 | |
QingShan Zhang | d84b320 | 2019-12-04 04:58:34 +0000 | [diff] [blame] | 187 | // Only chain two instructions together at most. |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 188 | const MachineInstr *DepMI = DepSU.getInstr(); |
QingShan Zhang | d84b320 | 2019-12-04 04:58:34 +0000 | [diff] [blame] | 189 | if (!hasLessThanNumFused(DepSU, 2) || |
| 190 | !shouldScheduleAdjacent(TII, ST, DepMI, AnchorMI)) |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 191 | continue; |
| 192 | |
Evandro Menezes | 54be62d | 2017-12-11 21:09:27 +0000 | [diff] [blame] | 193 | if (fuseInstructionPair(DAG, DepSU, AnchorSU)) |
| 194 | return true; |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 195 | } |
| 196 | |
| 197 | return false; |
| 198 | } |
| 199 | |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 200 | std::unique_ptr<ScheduleDAGMutation> |
Eugene Zelenko | 76bf48d | 2017-06-26 22:44:03 +0000 | [diff] [blame] | 201 | llvm::createMacroFusionDAGMutation( |
| 202 | ShouldSchedulePredTy shouldScheduleAdjacent) { |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 203 | if(EnableMacroFusion) |
Jonas Devlieghere | 0eaee54 | 2019-08-15 15:54:37 +0000 | [diff] [blame] | 204 | return std::make_unique<MacroFusion>(shouldScheduleAdjacent, true); |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 205 | return nullptr; |
| 206 | } |
| 207 | |
| 208 | std::unique_ptr<ScheduleDAGMutation> |
Eugene Zelenko | 76bf48d | 2017-06-26 22:44:03 +0000 | [diff] [blame] | 209 | llvm::createBranchMacroFusionDAGMutation( |
| 210 | ShouldSchedulePredTy shouldScheduleAdjacent) { |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 211 | if(EnableMacroFusion) |
Jonas Devlieghere | 0eaee54 | 2019-08-15 15:54:37 +0000 | [diff] [blame] | 212 | return std::make_unique<MacroFusion>(shouldScheduleAdjacent, false); |
Florian Hahn | 5f746c8 | 2017-06-19 12:53:31 +0000 | [diff] [blame] | 213 | return nullptr; |
| 214 | } |