blob: 283de3b31da02f8ebbd165967694e1a026334b5d [file] [log] [blame]
Tom Stellardca166212017-01-30 21:56:46 +00001//===- AMDGPULegalizerInfo.cpp -----------------------------------*- C++ -*-==//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9/// \file
10/// This file implements the targeting of the Machinelegalizer class for
11/// AMDGPU.
12/// \todo This should be generated by TableGen.
13//===----------------------------------------------------------------------===//
14
Yaxun Liu0124b542018-02-13 18:00:25 +000015#include "AMDGPU.h"
Tom Stellardca166212017-01-30 21:56:46 +000016#include "AMDGPULegalizerInfo.h"
Matt Arsenault85803362018-03-17 15:17:41 +000017#include "AMDGPUTargetMachine.h"
David Blaikieb3bde2e2017-11-17 01:07:10 +000018#include "llvm/CodeGen/TargetOpcodes.h"
Tom Stellardca166212017-01-30 21:56:46 +000019#include "llvm/CodeGen/ValueTypes.h"
Tom Stellardca166212017-01-30 21:56:46 +000020#include "llvm/IR/DerivedTypes.h"
Chandler Carruth6bda14b2017-06-06 11:49:48 +000021#include "llvm/IR/Type.h"
Tom Stellardca166212017-01-30 21:56:46 +000022#include "llvm/Support/Debug.h"
23
24using namespace llvm;
Daniel Sanders9ade5592018-01-29 17:37:29 +000025using namespace LegalizeActions;
Tom Stellardca166212017-01-30 21:56:46 +000026
Matt Arsenaultc3fe46b2018-03-08 16:24:16 +000027AMDGPULegalizerInfo::AMDGPULegalizerInfo(const SISubtarget &ST,
28 const GCNTargetMachine &TM) {
Tom Stellardca166212017-01-30 21:56:46 +000029 using namespace TargetOpcode;
30
Matt Arsenault85803362018-03-17 15:17:41 +000031 auto GetAddrSpacePtr = [&TM](unsigned AS) {
32 return LLT::pointer(AS, TM.getPointerSizeInBits(AS));
33 };
34
35 const LLT S1 = LLT::scalar(1);
Tom Stellardff63ee02017-06-19 13:15:45 +000036 const LLT V2S16 = LLT::vector(2, 16);
Matt Arsenault85803362018-03-17 15:17:41 +000037
Tom Stellardca166212017-01-30 21:56:46 +000038 const LLT S32 = LLT::scalar(32);
39 const LLT S64 = LLT::scalar(64);
Matt Arsenault85803362018-03-17 15:17:41 +000040
41 const LLT GlobalPtr = GetAddrSpacePtr(AMDGPUAS::GLOBAL_ADDRESS);
42 const LLT ConstantPtr = GetAddrSpacePtr(AMDGPUAS::CONSTANT_ADDRESS);
43
Tom Stellardca166212017-01-30 21:56:46 +000044
Tom Stellardee6e6452017-06-12 20:54:56 +000045 setAction({G_ADD, S32}, Legal);
Matt Arsenaultdc14ec02018-03-01 19:22:05 +000046 setAction({G_MUL, S32}, Legal);
Tom Stellardaf552dc2017-06-23 15:17:17 +000047 setAction({G_AND, S32}, Legal);
Matt Arsenault3f6a2042018-03-01 19:09:21 +000048 setAction({G_OR, S32}, Legal);
49 setAction({G_XOR, S32}, Legal);
Tom Stellardee6e6452017-06-12 20:54:56 +000050
Tom Stellardff63ee02017-06-19 13:15:45 +000051 setAction({G_BITCAST, V2S16}, Legal);
52 setAction({G_BITCAST, 1, S32}, Legal);
53
54 setAction({G_BITCAST, S32}, Legal);
55 setAction({G_BITCAST, 1, V2S16}, Legal);
56
Tom Stellarde0424122017-06-03 01:13:33 +000057 // FIXME: i1 operands to intrinsics should always be legal, but other i1
58 // values may not be legal. We need to figure out how to distinguish
59 // between these two scenarios.
60 setAction({G_CONSTANT, S1}, Legal);
Tom Stellarda0d67c72017-05-12 16:46:46 +000061 setAction({G_CONSTANT, S32}, Legal);
Tom Stellardca166212017-01-30 21:56:46 +000062 setAction({G_CONSTANT, S64}, Legal);
63
Tom Stellarddde28a82017-05-26 16:40:03 +000064 setAction({G_FCONSTANT, S32}, Legal);
Matt Arsenault2a26a282018-02-26 17:20:43 +000065 setAction({G_FCONSTANT, S64}, Legal);
Tom Stellarddde28a82017-05-26 16:40:03 +000066
Matt Arsenault06cbb272018-03-01 19:16:52 +000067 setAction({G_IMPLICIT_DEF, S32}, Legal);
68 setAction({G_IMPLICIT_DEF, S64}, Legal);
69
Tom Stellardd0c6cf22017-10-27 23:57:41 +000070 setAction({G_FADD, S32}, Legal);
71
Matt Arsenault8e80a5f2018-03-01 19:09:16 +000072 setAction({G_FCMP, S1}, Legal);
73 setAction({G_FCMP, 1, S32}, Legal);
74 setAction({G_FCMP, 1, S64}, Legal);
75
Tom Stellard3337d742017-08-02 22:56:30 +000076 setAction({G_FMUL, S32}, Legal);
77
Matt Arsenault0529a8e2018-03-01 20:56:21 +000078 setAction({G_ZEXT, S64}, Legal);
79 setAction({G_ZEXT, 1, S32}, Legal);
80
Matt Arsenaultdd022ce2018-03-01 19:04:25 +000081 setAction({G_FPTOSI, S32}, Legal);
82 setAction({G_FPTOSI, 1, S32}, Legal);
83
Tom Stellard33445762018-02-07 04:47:59 +000084 setAction({G_FPTOUI, S32}, Legal);
85 setAction({G_FPTOUI, 1, S32}, Legal);
86
Matt Arsenault85803362018-03-17 15:17:41 +000087 setAction({G_GEP, GlobalPtr}, Legal);
88 setAction({G_GEP, ConstantPtr}, Legal);
Tom Stellardca166212017-01-30 21:56:46 +000089 setAction({G_GEP, 1, S64}, Legal);
90
Tom Stellard8cd60a52017-06-06 14:16:50 +000091 setAction({G_ICMP, S1}, Legal);
92 setAction({G_ICMP, 1, S32}, Legal);
93
Matt Arsenault85803362018-03-17 15:17:41 +000094
95 getActionDefinitionsBuilder({G_LOAD, G_STORE})
96 .legalIf([=, &ST](const LegalityQuery &Query) {
97 const LLT &Ty0 = Query.Types[0];
98
99 // TODO: Decompose private loads into 4-byte components.
100 // TODO: Illegal flat loads on SI
101 switch (Ty0.getSizeInBits()) {
102 case 32:
103 case 64:
104 case 128:
105 return true;
106
107 case 96:
108 // XXX hasLoadX3
109 return (ST.getGeneration() >= AMDGPUSubtarget::SEA_ISLANDS);
110
111 case 256:
112 case 512:
113 // TODO: constant loads
114 default:
115 return false;
116 }
117 });
118
119
Tom Stellardca166212017-01-30 21:56:46 +0000120
Tom Stellard2860a422017-06-07 13:54:51 +0000121 setAction({G_SELECT, S32}, Legal);
122 setAction({G_SELECT, 1, S1}, Legal);
123
Tom Stellardeb8f1e22017-06-26 15:56:52 +0000124 setAction({G_SHL, S32}, Legal);
125
Tom Stellardca166212017-01-30 21:56:46 +0000126
127 // FIXME: When RegBankSelect inserts copies, it will only create new
128 // registers with scalar types. This means we can end up with
129 // G_LOAD/G_STORE/G_GEP instruction with scalar types for their pointer
130 // operands. In assert builds, the instruction selector will assert
131 // if it sees a generic instruction which isn't legal, so we need to
132 // tell it that scalar types are legal for pointer operands
133 setAction({G_GEP, S64}, Legal);
Tom Stellardca166212017-01-30 21:56:46 +0000134
Matt Arsenault7b9ed892018-03-12 13:35:53 +0000135 for (unsigned Op : {G_EXTRACT_VECTOR_ELT, G_INSERT_VECTOR_ELT}) {
136 getActionDefinitionsBuilder(Op)
137 .legalIf([=](const LegalityQuery &Query) {
138 const LLT &VecTy = Query.Types[1];
139 const LLT &IdxTy = Query.Types[2];
140 return VecTy.getSizeInBits() % 32 == 0 &&
141 VecTy.getSizeInBits() <= 512 &&
142 IdxTy.getSizeInBits() == 32;
143 });
144 }
145
Matt Arsenault71272e62018-03-05 16:25:15 +0000146 // FIXME: Doesn't handle extract of illegal sizes.
147 getActionDefinitionsBuilder(G_EXTRACT)
148 .unsupportedIf([=](const LegalityQuery &Query) {
149 return Query.Types[0].getSizeInBits() >= Query.Types[1].getSizeInBits();
150 })
151 .legalIf([=](const LegalityQuery &Query) {
152 const LLT &Ty0 = Query.Types[0];
153 const LLT &Ty1 = Query.Types[1];
154 return (Ty0.getSizeInBits() % 32 == 0) &&
155 (Ty1.getSizeInBits() % 32 == 0);
156 });
157
Matt Arsenault503afda2018-03-12 13:35:43 +0000158 // Merge/Unmerge
159 for (unsigned Op : {G_MERGE_VALUES, G_UNMERGE_VALUES}) {
160 unsigned BigTyIdx = Op == G_MERGE_VALUES ? 0 : 1;
161 unsigned LitTyIdx = Op == G_MERGE_VALUES ? 1 : 0;
162
163 getActionDefinitionsBuilder(Op)
164 .legalIf([=](const LegalityQuery &Query) {
165 const LLT &BigTy = Query.Types[BigTyIdx];
166 const LLT &LitTy = Query.Types[LitTyIdx];
167 return BigTy.getSizeInBits() % 32 == 0 &&
168 LitTy.getSizeInBits() % 32 == 0 &&
169 BigTy.getSizeInBits() <= 512;
170 })
171 // Any vectors left are the wrong size. Scalarize them.
172 .fewerElementsIf([](const LegalityQuery &Query) { return true; },
173 [](const LegalityQuery &Query) {
174 return std::make_pair(
175 0, Query.Types[0].getElementType());
176 })
177 .fewerElementsIf([](const LegalityQuery &Query) { return true; },
178 [](const LegalityQuery &Query) {
179 return std::make_pair(
180 1, Query.Types[1].getElementType());
181 });
182
183 }
184
Tom Stellardca166212017-01-30 21:56:46 +0000185 computeTables();
186}