Dan Gohman | 9becddd | 2010-04-16 23:04:22 +0000 | [diff] [blame] | 1 | //===-- ARMSelectionDAGInfo.cpp - ARM SelectionDAG Info -------------------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This file implements the ARMSelectionDAGInfo class. |
| 11 | // |
| 12 | //===----------------------------------------------------------------------===// |
| 13 | |
Dan Gohman | bb919df | 2010-05-11 17:31:57 +0000 | [diff] [blame] | 14 | #include "ARMTargetMachine.h" |
Renato Golin | 4cd5187 | 2011-05-22 21:41:23 +0000 | [diff] [blame] | 15 | #include "llvm/CodeGen/SelectionDAG.h" |
Chandler Carruth | 9fb823b | 2013-01-02 11:36:10 +0000 | [diff] [blame] | 16 | #include "llvm/IR/DerivedTypes.h" |
Dan Gohman | 9becddd | 2010-04-16 23:04:22 +0000 | [diff] [blame] | 17 | using namespace llvm; |
| 18 | |
Chandler Carruth | 84e68b2 | 2014-04-22 02:41:26 +0000 | [diff] [blame] | 19 | #define DEBUG_TYPE "arm-selectiondag-info" |
| 20 | |
Eric Christopher | 70e005a | 2014-06-12 23:39:49 +0000 | [diff] [blame] | 21 | ARMSelectionDAGInfo::ARMSelectionDAGInfo(const DataLayout &DL) |
| 22 | : TargetSelectionDAGInfo(&DL) {} |
Dan Gohman | 9becddd | 2010-04-16 23:04:22 +0000 | [diff] [blame] | 23 | |
| 24 | ARMSelectionDAGInfo::~ARMSelectionDAGInfo() { |
| 25 | } |
Dan Gohman | bb919df | 2010-05-11 17:31:57 +0000 | [diff] [blame] | 26 | |
| 27 | SDValue |
Andrew Trick | ef9de2a | 2013-05-25 02:42:55 +0000 | [diff] [blame] | 28 | ARMSelectionDAGInfo::EmitTargetCodeForMemcpy(SelectionDAG &DAG, SDLoc dl, |
Dan Gohman | bb919df | 2010-05-11 17:31:57 +0000 | [diff] [blame] | 29 | SDValue Chain, |
| 30 | SDValue Dst, SDValue Src, |
| 31 | SDValue Size, unsigned Align, |
| 32 | bool isVolatile, bool AlwaysInline, |
Chris Lattner | 2510de2 | 2010-09-21 05:40:29 +0000 | [diff] [blame] | 33 | MachinePointerInfo DstPtrInfo, |
| 34 | MachinePointerInfo SrcPtrInfo) const { |
Eric Christopher | 22b2ad2 | 2015-02-20 08:24:37 +0000 | [diff] [blame] | 35 | const ARMSubtarget &Subtarget = |
| 36 | DAG.getMachineFunction().getSubtarget<ARMSubtarget>(); |
Dan Gohman | bb919df | 2010-05-11 17:31:57 +0000 | [diff] [blame] | 37 | // Do repeated 4-byte loads and stores. To be improved. |
| 38 | // This requires 4-byte alignment. |
| 39 | if ((Align & 3) != 0) |
| 40 | return SDValue(); |
Chris Lattner | 0ab5e2c | 2011-04-15 05:18:47 +0000 | [diff] [blame] | 41 | // This requires the copy size to be a constant, preferably |
Dan Gohman | bb919df | 2010-05-11 17:31:57 +0000 | [diff] [blame] | 42 | // within a subtarget-specific limit. |
| 43 | ConstantSDNode *ConstantSize = dyn_cast<ConstantSDNode>(Size); |
| 44 | if (!ConstantSize) |
| 45 | return SDValue(); |
| 46 | uint64_t SizeVal = ConstantSize->getZExtValue(); |
Eric Christopher | 70e005a | 2014-06-12 23:39:49 +0000 | [diff] [blame] | 47 | if (!AlwaysInline && SizeVal > Subtarget.getMaxInlineSizeThreshold()) |
Dan Gohman | bb919df | 2010-05-11 17:31:57 +0000 | [diff] [blame] | 48 | return SDValue(); |
| 49 | |
| 50 | unsigned BytesLeft = SizeVal & 3; |
| 51 | unsigned NumMemOps = SizeVal >> 2; |
| 52 | unsigned EmittedNumMemOps = 0; |
| 53 | EVT VT = MVT::i32; |
| 54 | unsigned VTSize = 4; |
| 55 | unsigned i = 0; |
James Molloy | a70697e | 2014-05-16 14:24:22 +0000 | [diff] [blame] | 56 | // Emit a maximum of 4 loads in Thumb1 since we have fewer registers |
Eric Christopher | 70e005a | 2014-06-12 23:39:49 +0000 | [diff] [blame] | 57 | const unsigned MAX_LOADS_IN_LDM = Subtarget.isThumb1Only() ? 4 : 6; |
James Molloy | a70697e | 2014-05-16 14:24:22 +0000 | [diff] [blame] | 58 | SDValue TFOps[6]; |
| 59 | SDValue Loads[6]; |
Dan Gohman | bb919df | 2010-05-11 17:31:57 +0000 | [diff] [blame] | 60 | uint64_t SrcOff = 0, DstOff = 0; |
| 61 | |
| 62 | // Emit up to MAX_LOADS_IN_LDM loads, then a TokenFactor barrier, then the |
| 63 | // same number of stores. The loads and stores will get combined into |
| 64 | // ldm/stm later on. |
| 65 | while (EmittedNumMemOps < NumMemOps) { |
| 66 | for (i = 0; |
| 67 | i < MAX_LOADS_IN_LDM && EmittedNumMemOps + i < NumMemOps; ++i) { |
| 68 | Loads[i] = DAG.getLoad(VT, dl, Chain, |
| 69 | DAG.getNode(ISD::ADD, dl, MVT::i32, Src, |
Sergey Dmitrouk | adb4c69 | 2015-04-28 11:56:37 +0000 | [diff] [blame^] | 70 | DAG.getConstant(SrcOff, dl, MVT::i32)), |
Chris Lattner | 2510de2 | 2010-09-21 05:40:29 +0000 | [diff] [blame] | 71 | SrcPtrInfo.getWithOffset(SrcOff), isVolatile, |
Pete Cooper | 82cd9e8 | 2011-11-08 18:42:53 +0000 | [diff] [blame] | 72 | false, false, 0); |
Dan Gohman | bb919df | 2010-05-11 17:31:57 +0000 | [diff] [blame] | 73 | TFOps[i] = Loads[i].getValue(1); |
| 74 | SrcOff += VTSize; |
| 75 | } |
Craig Topper | 48d114b | 2014-04-26 18:35:24 +0000 | [diff] [blame] | 76 | Chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, |
Craig Topper | 2d2aa0c | 2014-04-30 07:17:30 +0000 | [diff] [blame] | 77 | makeArrayRef(TFOps, i)); |
Dan Gohman | bb919df | 2010-05-11 17:31:57 +0000 | [diff] [blame] | 78 | |
| 79 | for (i = 0; |
| 80 | i < MAX_LOADS_IN_LDM && EmittedNumMemOps + i < NumMemOps; ++i) { |
| 81 | TFOps[i] = DAG.getStore(Chain, dl, Loads[i], |
| 82 | DAG.getNode(ISD::ADD, dl, MVT::i32, Dst, |
Sergey Dmitrouk | adb4c69 | 2015-04-28 11:56:37 +0000 | [diff] [blame^] | 83 | DAG.getConstant(DstOff, dl, MVT::i32)), |
Chris Lattner | 2510de2 | 2010-09-21 05:40:29 +0000 | [diff] [blame] | 84 | DstPtrInfo.getWithOffset(DstOff), |
| 85 | isVolatile, false, 0); |
Dan Gohman | bb919df | 2010-05-11 17:31:57 +0000 | [diff] [blame] | 86 | DstOff += VTSize; |
| 87 | } |
Craig Topper | 48d114b | 2014-04-26 18:35:24 +0000 | [diff] [blame] | 88 | Chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, |
Craig Topper | 2d2aa0c | 2014-04-30 07:17:30 +0000 | [diff] [blame] | 89 | makeArrayRef(TFOps, i)); |
Dan Gohman | bb919df | 2010-05-11 17:31:57 +0000 | [diff] [blame] | 90 | |
| 91 | EmittedNumMemOps += i; |
| 92 | } |
| 93 | |
| 94 | if (BytesLeft == 0) |
| 95 | return Chain; |
| 96 | |
| 97 | // Issue loads / stores for the trailing (1 - 3) bytes. |
| 98 | unsigned BytesLeftSave = BytesLeft; |
| 99 | i = 0; |
| 100 | while (BytesLeft) { |
| 101 | if (BytesLeft >= 2) { |
| 102 | VT = MVT::i16; |
| 103 | VTSize = 2; |
| 104 | } else { |
| 105 | VT = MVT::i8; |
| 106 | VTSize = 1; |
| 107 | } |
| 108 | |
| 109 | Loads[i] = DAG.getLoad(VT, dl, Chain, |
| 110 | DAG.getNode(ISD::ADD, dl, MVT::i32, Src, |
Sergey Dmitrouk | adb4c69 | 2015-04-28 11:56:37 +0000 | [diff] [blame^] | 111 | DAG.getConstant(SrcOff, dl, MVT::i32)), |
Pete Cooper | 82cd9e8 | 2011-11-08 18:42:53 +0000 | [diff] [blame] | 112 | SrcPtrInfo.getWithOffset(SrcOff), |
| 113 | false, false, false, 0); |
Dan Gohman | bb919df | 2010-05-11 17:31:57 +0000 | [diff] [blame] | 114 | TFOps[i] = Loads[i].getValue(1); |
| 115 | ++i; |
| 116 | SrcOff += VTSize; |
| 117 | BytesLeft -= VTSize; |
| 118 | } |
Craig Topper | 48d114b | 2014-04-26 18:35:24 +0000 | [diff] [blame] | 119 | Chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, |
Craig Topper | 2d2aa0c | 2014-04-30 07:17:30 +0000 | [diff] [blame] | 120 | makeArrayRef(TFOps, i)); |
Dan Gohman | bb919df | 2010-05-11 17:31:57 +0000 | [diff] [blame] | 121 | |
| 122 | i = 0; |
| 123 | BytesLeft = BytesLeftSave; |
| 124 | while (BytesLeft) { |
| 125 | if (BytesLeft >= 2) { |
| 126 | VT = MVT::i16; |
| 127 | VTSize = 2; |
| 128 | } else { |
| 129 | VT = MVT::i8; |
| 130 | VTSize = 1; |
| 131 | } |
| 132 | |
| 133 | TFOps[i] = DAG.getStore(Chain, dl, Loads[i], |
| 134 | DAG.getNode(ISD::ADD, dl, MVT::i32, Dst, |
Sergey Dmitrouk | adb4c69 | 2015-04-28 11:56:37 +0000 | [diff] [blame^] | 135 | DAG.getConstant(DstOff, dl, MVT::i32)), |
Chris Lattner | 2510de2 | 2010-09-21 05:40:29 +0000 | [diff] [blame] | 136 | DstPtrInfo.getWithOffset(DstOff), false, false, 0); |
Dan Gohman | bb919df | 2010-05-11 17:31:57 +0000 | [diff] [blame] | 137 | ++i; |
| 138 | DstOff += VTSize; |
| 139 | BytesLeft -= VTSize; |
| 140 | } |
Craig Topper | 48d114b | 2014-04-26 18:35:24 +0000 | [diff] [blame] | 141 | return DAG.getNode(ISD::TokenFactor, dl, MVT::Other, |
Craig Topper | 2d2aa0c | 2014-04-30 07:17:30 +0000 | [diff] [blame] | 142 | makeArrayRef(TFOps, i)); |
Dan Gohman | bb919df | 2010-05-11 17:31:57 +0000 | [diff] [blame] | 143 | } |
Renato Golin | 4cd5187 | 2011-05-22 21:41:23 +0000 | [diff] [blame] | 144 | |
| 145 | // Adjust parameters for memset, EABI uses format (ptr, size, value), |
| 146 | // GNU library uses (ptr, value, size) |
| 147 | // See RTABI section 4.3.4 |
Jim Grosbach | e7e2aca | 2011-09-13 20:30:37 +0000 | [diff] [blame] | 148 | SDValue ARMSelectionDAGInfo:: |
Andrew Trick | ef9de2a | 2013-05-25 02:42:55 +0000 | [diff] [blame] | 149 | EmitTargetCodeForMemset(SelectionDAG &DAG, SDLoc dl, |
Jim Grosbach | e7e2aca | 2011-09-13 20:30:37 +0000 | [diff] [blame] | 150 | SDValue Chain, SDValue Dst, |
| 151 | SDValue Src, SDValue Size, |
| 152 | unsigned Align, bool isVolatile, |
| 153 | MachinePointerInfo DstPtrInfo) const { |
Eric Christopher | 22b2ad2 | 2015-02-20 08:24:37 +0000 | [diff] [blame] | 154 | const ARMSubtarget &Subtarget = |
| 155 | DAG.getMachineFunction().getSubtarget<ARMSubtarget>(); |
Tim Northover | d6a729b | 2014-01-06 14:28:05 +0000 | [diff] [blame] | 156 | // Use default for non-AAPCS (or MachO) subtargets |
Eric Christopher | 70e005a | 2014-06-12 23:39:49 +0000 | [diff] [blame] | 157 | if (!Subtarget.isAAPCS_ABI() || Subtarget.isTargetMachO() || |
| 158 | Subtarget.isTargetWindows()) |
Renato Golin | 4cd5187 | 2011-05-22 21:41:23 +0000 | [diff] [blame] | 159 | return SDValue(); |
| 160 | |
Eric Christopher | 22b2ad2 | 2015-02-20 08:24:37 +0000 | [diff] [blame] | 161 | const ARMTargetLowering &TLI = *Subtarget.getTargetLowering(); |
Renato Golin | 4cd5187 | 2011-05-22 21:41:23 +0000 | [diff] [blame] | 162 | TargetLowering::ArgListTy Args; |
| 163 | TargetLowering::ArgListEntry Entry; |
| 164 | |
| 165 | // First argument: data pointer |
Chandler Carruth | 7ec5085 | 2012-11-01 08:07:29 +0000 | [diff] [blame] | 166 | Type *IntPtrTy = TLI.getDataLayout()->getIntPtrType(*DAG.getContext()); |
Renato Golin | 4cd5187 | 2011-05-22 21:41:23 +0000 | [diff] [blame] | 167 | Entry.Node = Dst; |
| 168 | Entry.Ty = IntPtrTy; |
| 169 | Args.push_back(Entry); |
| 170 | |
| 171 | // Second argument: buffer size |
| 172 | Entry.Node = Size; |
| 173 | Entry.Ty = IntPtrTy; |
| 174 | Entry.isSExt = false; |
| 175 | Args.push_back(Entry); |
| 176 | |
| 177 | // Extend or truncate the argument to be an i32 value for the call. |
| 178 | if (Src.getValueType().bitsGT(MVT::i32)) |
| 179 | Src = DAG.getNode(ISD::TRUNCATE, dl, MVT::i32, Src); |
| 180 | else |
| 181 | Src = DAG.getNode(ISD::ZERO_EXTEND, dl, MVT::i32, Src); |
| 182 | |
| 183 | // Third argument: value to fill |
| 184 | Entry.Node = Src; |
| 185 | Entry.Ty = Type::getInt32Ty(*DAG.getContext()); |
| 186 | Entry.isSExt = true; |
| 187 | Args.push_back(Entry); |
| 188 | |
| 189 | // Emit __eabi_memset call |
Saleem Abdulrasool | f3a5a5c | 2014-05-17 21:50:17 +0000 | [diff] [blame] | 190 | TargetLowering::CallLoweringInfo CLI(DAG); |
| 191 | CLI.setDebugLoc(dl).setChain(Chain) |
| 192 | .setCallee(TLI.getLibcallCallingConv(RTLIB::MEMSET), |
| 193 | Type::getVoidTy(*DAG.getContext()), |
| 194 | DAG.getExternalSymbol(TLI.getLibcallName(RTLIB::MEMSET), |
Juergen Ributzka | 3bd03c7 | 2014-07-01 22:01:54 +0000 | [diff] [blame] | 195 | TLI.getPointerTy()), std::move(Args), 0) |
Saleem Abdulrasool | f3a5a5c | 2014-05-17 21:50:17 +0000 | [diff] [blame] | 196 | .setDiscardResult(); |
Renato Golin | 4cd5187 | 2011-05-22 21:41:23 +0000 | [diff] [blame] | 197 | |
Saleem Abdulrasool | f3a5a5c | 2014-05-17 21:50:17 +0000 | [diff] [blame] | 198 | std::pair<SDValue,SDValue> CallResult = TLI.LowerCallTo(CLI); |
Renato Golin | 4cd5187 | 2011-05-22 21:41:23 +0000 | [diff] [blame] | 199 | return CallResult.second; |
| 200 | } |