blob: 929ac2bd0d938b0eb8a3355a6a4d190e0c33a255 [file] [log] [blame]
//===- HexagonVExtract.cpp ------------------------------------------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
// This pass will replace multiple occurrences of V6_extractw from the same
// vector register with a combination of a vector store and scalar loads.
//===----------------------------------------------------------------------===//
12
13#include "Hexagon.h"
14#include "HexagonInstrInfo.h"
15#include "HexagonRegisterInfo.h"
16#include "HexagonSubtarget.h"
17#include "llvm/ADT/SmallVector.h"
18#include "llvm/PassSupport.h"
19#include "llvm/CodeGen/MachineBasicBlock.h"
20#include "llvm/CodeGen/MachineFunction.h"
21#include "llvm/CodeGen/MachineFunctionPass.h"
22#include "llvm/CodeGen/MachineInstrBuilder.h"
23#include "llvm/CodeGen/MachineRegisterInfo.h"
24#include "llvm/Support/CommandLine.h"
25
26#include <map>
27
28using namespace llvm;
29
30static cl::opt<unsigned> VExtractThreshold("hexagon-vextract-threshold",
31 cl::Hidden, cl::ZeroOrMore, cl::init(1),
32 cl::desc("Threshold for triggering vextract replacement"));
33
34namespace llvm {
35 void initializeHexagonVExtractPass(PassRegistry& Registry);
36 FunctionPass *createHexagonVExtract();
37}
38
39namespace {
40 class HexagonVExtract : public MachineFunctionPass {
41 public:
42 static char ID;
43 HexagonVExtract() : MachineFunctionPass(ID) {}
44
45 StringRef getPassName() const override {
46 return "Hexagon optimize vextract";
47 }
48 void getAnalysisUsage(AnalysisUsage &AU) const override {
49 MachineFunctionPass::getAnalysisUsage(AU);
50 }
51 bool runOnMachineFunction(MachineFunction &MF) override;
52
53 private:
54 const HexagonSubtarget *HST = nullptr;
55 const HexagonInstrInfo *HII = nullptr;
56
57 unsigned genElemLoad(MachineInstr *ExtI, unsigned BaseR,
58 MachineRegisterInfo &MRI);
59 };
60
61 char HexagonVExtract::ID = 0;
62}
63
64INITIALIZE_PASS(HexagonVExtract, "hexagon-vextract",
65 "Hexagon optimize vextract", false, false)
66
67unsigned HexagonVExtract::genElemLoad(MachineInstr *ExtI, unsigned BaseR,
68 MachineRegisterInfo &MRI) {
69 MachineBasicBlock &ExtB = *ExtI->getParent();
70 DebugLoc DL = ExtI->getDebugLoc();
71 unsigned ElemR = MRI.createVirtualRegister(&Hexagon::IntRegsRegClass);
72
73 unsigned ExtIdxR = ExtI->getOperand(2).getReg();
74 unsigned ExtIdxS = ExtI->getOperand(2).getSubReg();
75
76 // Simplified check for a compile-time constant value of ExtIdxR.
77 if (ExtIdxS == 0) {
78 MachineInstr *DI = MRI.getVRegDef(ExtIdxR);
79 if (DI->getOpcode() == Hexagon::A2_tfrsi) {
80 unsigned V = DI->getOperand(1).getImm();
81 V &= (HST->getVectorLength()-1) & -4u;
82
83 BuildMI(ExtB, ExtI, DL, HII->get(Hexagon::L2_loadri_io), ElemR)
84 .addReg(BaseR)
85 .addImm(V);
86 return ElemR;
87 }
88 }
89
90 unsigned IdxR = MRI.createVirtualRegister(&Hexagon::IntRegsRegClass);
91 BuildMI(ExtB, ExtI, DL, HII->get(Hexagon::A2_andir), IdxR)
92 .add(ExtI->getOperand(2))
93 .addImm(-4);
94 BuildMI(ExtB, ExtI, DL, HII->get(Hexagon::L4_loadri_rr), ElemR)
95 .addReg(BaseR)
96 .addReg(IdxR)
97 .addImm(0);
98 return ElemR;
99}
100
101bool HexagonVExtract::runOnMachineFunction(MachineFunction &MF) {
102 HST = &MF.getSubtarget<HexagonSubtarget>();
103 HII = HST->getInstrInfo();
104 const auto &HRI = *HST->getRegisterInfo();
105 MachineRegisterInfo &MRI = MF.getRegInfo();
106 MachineFrameInfo &MFI = MF.getFrameInfo();
107 std::map<unsigned, SmallVector<MachineInstr*,4>> VExtractMap;
108 bool Changed = false;
109
110 for (MachineBasicBlock &MBB : MF) {
111 for (MachineInstr &MI : MBB) {
112 unsigned Opc = MI.getOpcode();
113 if (Opc != Hexagon::V6_extractw)
114 continue;
115 unsigned VecR = MI.getOperand(1).getReg();
116 VExtractMap[VecR].push_back(&MI);
117 }
118 }
119
120 for (auto &P : VExtractMap) {
121 unsigned VecR = P.first;
122 if (P.second.size() <= VExtractThreshold)
123 continue;
124
125 const auto &VecRC = *MRI.getRegClass(VecR);
126 int FI = MFI.CreateSpillStackObject(HRI.getSpillSize(VecRC),
127 HRI.getSpillAlignment(VecRC));
128 MachineInstr *DefI = MRI.getVRegDef(VecR);
129 MachineBasicBlock::iterator At = std::next(DefI->getIterator());
130 MachineBasicBlock &DefB = *DefI->getParent();
131 unsigned StoreOpc = VecRC.getID() == Hexagon::HvxVRRegClassID
132 ? Hexagon::V6_vS32b_ai
133 : Hexagon::PS_vstorerw_ai;
134 BuildMI(DefB, At, DefI->getDebugLoc(), HII->get(StoreOpc))
135 .addFrameIndex(FI)
136 .addImm(0)
137 .addReg(VecR);
138
139 unsigned VecSize = HRI.getRegSizeInBits(VecRC) / 8;
140
141 for (MachineInstr *ExtI : P.second) {
142 assert(ExtI->getOpcode() == Hexagon::V6_extractw);
Krzysztof Parzyszek95614ac2018-01-26 21:17:14 +0000143 unsigned SR = ExtI->getOperand(1).getSubReg();
Richard Trieu8610c9f2018-01-26 21:55:13 +0000144 assert(ExtI->getOperand(1).getReg() == VecR);
Krzysztof Parzyszek95614ac2018-01-26 21:17:14 +0000145
146 MachineBasicBlock &ExtB = *ExtI->getParent();
147 DebugLoc DL = ExtI->getDebugLoc();
148 unsigned BaseR = MRI.createVirtualRegister(&Hexagon::IntRegsRegClass);
149 BuildMI(ExtB, ExtI, DL, HII->get(Hexagon::PS_fi), BaseR)
150 .addFrameIndex(FI)
151 .addImm(SR == 0 ? 0 : VecSize/2);
152
153 unsigned ElemR = genElemLoad(ExtI, BaseR, MRI);
154 unsigned ExtR = ExtI->getOperand(0).getReg();
155 MRI.replaceRegWith(ExtR, ElemR);
156 ExtB.erase(ExtI);
157 Changed = true;
158 }
159 }
160
161 return Changed;
162}
163
164FunctionPass *llvm::createHexagonVExtract() {
165 return new HexagonVExtract();
166}