| Justin Holewinski | ae556d3 | 2012-05-04 20:18:50 +0000 | [diff] [blame] | 1 | //===- NVPTXSubtarget.cpp - NVPTX Subtarget Information -------------------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This file implements the NVPTX specific subclass of TargetSubtarget. |
| 11 | // |
| 12 | //===----------------------------------------------------------------------===// |
| 13 | |
| 14 | #include "NVPTXSubtarget.h" |
| Eric Christopher | 6aad8b1 | 2015-02-19 00:08:14 +0000 | [diff] [blame] | 15 | #include "NVPTXTargetMachine.h" |
| Chandler Carruth | e96dd89 | 2014-04-21 22:55:11 +0000 | [diff] [blame] | 16 | |
| Chandler Carruth | d174b72 | 2014-04-22 02:03:14 +0000 | [diff] [blame] | 17 | using namespace llvm; |
| 18 | |
| Chandler Carruth | e96dd89 | 2014-04-21 22:55:11 +0000 | [diff] [blame] | 19 | #define DEBUG_TYPE "nvptx-subtarget" |
| 20 | |
| Justin Holewinski | ae556d3 | 2012-05-04 20:18:50 +0000 | [diff] [blame] | 21 | #define GET_SUBTARGETINFO_ENUM |
| 22 | #define GET_SUBTARGETINFO_TARGET_DESC |
| 23 | #define GET_SUBTARGETINFO_CTOR |
| 24 | #include "NVPTXGenSubtargetInfo.inc" |
| 25 | |
| Artem Belevich | 64dc9be | 2017-01-13 20:56:17 +0000 | [diff] [blame] | 26 | static cl::opt<bool> |
| 27 | NoF16Math("nvptx-no-f16-math", cl::ZeroOrMore, cl::Hidden, |
| 28 | cl::desc("NVPTX Specific: Disable generation of f16 math ops."), |
| 29 | cl::init(false)); |
| 30 | |
| Juergen Ributzka | d12ccbd | 2013-11-19 00:57:56 +0000 | [diff] [blame] | 31 | // Pin the vtable to this file. |
| 32 | void NVPTXSubtarget::anchor() {} |
| 33 | |
| Eric Christopher | 493f91b | 2014-06-27 04:33:14 +0000 | [diff] [blame] | 34 | NVPTXSubtarget &NVPTXSubtarget::initializeSubtargetDependencies(StringRef CPU, |
| 35 | StringRef FS) { |
| 36 | // Provide the default CPU if we don't have one. |
| Eric Christopher | d813286 | 2014-06-27 02:05:19 +0000 | [diff] [blame] | 37 | TargetName = CPU.empty() ? "sm_20" : CPU; |
| 38 | |
| 39 | ParseSubtargetFeatures(TargetName, FS); |
| Justin Holewinski | ae556d3 | 2012-05-04 20:18:50 +0000 | [diff] [blame] | 40 | |
| Justin Holewinski | 602fa5b | 2014-06-27 18:35:18 +0000 | [diff] [blame] | 41 | // Set default to PTX 3.2 (CUDA 5.5) |
| 42 | if (PTXVersion == 0) { |
| 43 | PTXVersion = 32; |
| 44 | } |
| Eric Christopher | 493f91b | 2014-06-27 04:33:14 +0000 | [diff] [blame] | 45 | |
| 46 | return *this; |
| 47 | } |
| 48 | |
| Daniel Sanders | a73f1fd | 2015-06-10 12:11:26 +0000 | [diff] [blame] | 49 | NVPTXSubtarget::NVPTXSubtarget(const Triple &TT, const std::string &CPU, |
| Eric Christopher | 6aad8b1 | 2015-02-19 00:08:14 +0000 | [diff] [blame] | 50 | const std::string &FS, |
| Eric Christopher | 02389e3 | 2015-02-19 00:08:27 +0000 | [diff] [blame] | 51 | const NVPTXTargetMachine &TM) |
| Daniel Sanders | 50f1723 | 2015-09-15 16:17:27 +0000 | [diff] [blame] | 52 | : NVPTXGenSubtargetInfo(TT, CPU, FS), PTXVersion(0), SmVersion(20), TM(TM), |
| 53 | InstrInfo(), TLInfo(TM, initializeSubtargetDependencies(CPU, FS)), |
| Mehdi Amini | 157e5a6 | 2015-07-09 02:10:08 +0000 | [diff] [blame] | 54 | FrameLowering() {} |
| Eric Christopher | 493f91b | 2014-06-27 04:33:14 +0000 | [diff] [blame] | 55 | |
| Eric Christopher | beffc4e | 2015-02-19 00:08:23 +0000 | [diff] [blame] | 56 | bool NVPTXSubtarget::hasImageHandles() const { |
| 57 | // Enable handles for Kepler+, where CUDA supports indirect surfaces and |
| 58 | // textures |
| 59 | if (TM.getDrvInterface() == NVPTX::CUDA) |
| 60 | return (SmVersion >= 30); |
| 61 | |
| 62 | // Disabled, otherwise |
| 63 | return false; |
| Justin Holewinski | ae556d3 | 2012-05-04 20:18:50 +0000 | [diff] [blame] | 64 | } |
| Artem Belevich | 64dc9be | 2017-01-13 20:56:17 +0000 | [diff] [blame] | 65 | |
| 66 | bool NVPTXSubtarget::allowFP16Math() const { |
| 67 | return hasFP16Math() && NoF16Math == false; |
| 68 | } |