Correctly handle a one-word struct passed byval on x86_64.
rdar://problem/6920088


git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@132105 91177308-0d34-0410-b5e6-96231b3b80d8
diff --git a/lib/Target/X86/X86ISelLowering.cpp b/lib/Target/X86/X86ISelLowering.cpp
index c8c3f59..fd7d1f7 100644
--- a/lib/Target/X86/X86ISelLowering.cpp
+++ b/lib/Target/X86/X86ISelLowering.cpp
@@ -2091,28 +2091,54 @@
     }
 
     if (VA.isRegLoc()) {
-      RegsToPass.push_back(std::make_pair(VA.getLocReg(), Arg));
-      if (isVarArg && IsWin64) {
-        // Win64 ABI requires argument XMM reg to be copied to the corresponding
-        // shadow reg if callee is a varargs function.
-        unsigned ShadowReg = 0;
-        switch (VA.getLocReg()) {
-        case X86::XMM0: ShadowReg = X86::RCX; break;
-        case X86::XMM1: ShadowReg = X86::RDX; break;
-        case X86::XMM2: ShadowReg = X86::R8; break;
-        case X86::XMM3: ShadowReg = X86::R9; break;
+      if (isByVal) {
+        if (CCInfo.isFirstByValRegValid()) {
+          EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
+          unsigned reg = CCInfo.getFirstByValReg();
+          SDValue Load = DAG.getLoad(PtrVT, dl, Chain, Arg,
+                                     MachinePointerInfo(),
+                                     false, false, 0);
+          MemOpChains.push_back(Load.getValue(1));
+          RegsToPass.push_back(std::make_pair(reg, Load));
+          if (Flags.getByValSize() > 8) {    // Two-word struct.
+            // NOTE(review): reg+1 assumes consecutive register enums; confirm.
+            SDValue AddArg = DAG.getNode(ISD::ADD, dl, PtrVT, Arg,
+                                         DAG.getConstant(8, PtrVT));
+            SDValue Load2 = DAG.getLoad(PtrVT, dl, Chain, AddArg,
+                                        MachinePointerInfo(), false, false, 0);
+            MemOpChains.push_back(Load2.getValue(1));
+            RegsToPass.push_back(std::make_pair(reg+1, Load2));
+          }
+          CCInfo.clearFirstByValReg();
         }
-        if (ShadowReg)
-          RegsToPass.push_back(std::make_pair(ShadowReg, Arg));
+      } else {
+        // Usual case:
+        RegsToPass.push_back(std::make_pair(VA.getLocReg(), Arg));
+        if (isVarArg && IsWin64) {
+          // Win64 ABI requires argument XMM reg to be copied to the corresponding
+          // shadow reg if callee is a varargs function.
+          unsigned ShadowReg = 0;
+          switch (VA.getLocReg()) {
+          case X86::XMM0: ShadowReg = X86::RCX; break;
+          case X86::XMM1: ShadowReg = X86::RDX; break;
+          case X86::XMM2: ShadowReg = X86::R8; break;
+          case X86::XMM3: ShadowReg = X86::R9; break;
+          }
+          if (ShadowReg)
+            RegsToPass.push_back(std::make_pair(ShadowReg, Arg));
+        }
       }
     } else if (!IsSibcall && (!isTailCall || isByVal)) {
+      if (isByVal) {    // In memory.
+        // TODO: no special handling yet; falls through to the store below.
+      }
       assert(VA.isMemLoc());
       if (StackPtr.getNode() == 0)
         StackPtr = DAG.getCopyFromReg(Chain, dl, X86StackPtr, getPointerTy());
       MemOpChains.push_back(LowerMemOpCallTo(Chain, StackPtr, Arg,
                                              dl, DAG, VA, Flags));
     }
-  }
+  }     // end for (all register/memloc assignments)
 
   if (!MemOpChains.empty())
     Chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
@@ -2438,6 +2464,39 @@
   return Offset;
 }
 
+/// HandleByVal - Try to pass a small byval aggregate in integer argument
+/// registers on x86-64 instead of on the stack.  On success the first
+/// register is recorded in State and size is set to 0 so that the caller
+/// allocates no stack for it; otherwise size is left unchanged.
+void
+llvm::X86TargetLowering::HandleByVal(CCState *State, unsigned &size) const {
+  // Only 64-bit targets, and only aggregates of one or two 8-byte words.
+  if (!Subtarget->is64Bit() || size == 0 || size > 16)
+    return;
+
+  static const unsigned GPR64ArgRegs64Bit[] = {
+    X86::RDI, X86::RSI, X86::RDX, X86::RCX, X86::R8, X86::R9
+  };
+  const unsigned NumArgRegs =
+    sizeof(GPR64ArgRegs64Bit) / sizeof(GPR64ArgRegs64Bit[0]);
+  const unsigned RegsRequired = (size > 8) ? 2 : 1;
+
+  // Bail out unless every word fits in a register; never split the
+  // aggregate between registers and the stack.
+  unsigned NextRegToAlloc =
+    State->getFirstUnallocated(GPR64ArgRegs64Bit, NumArgRegs);
+  if (NextRegToAlloc + RegsRequired > NumArgRegs)
+    return;
+
+  size = 0;     // Tell caller not to allocate stack.
+
+  // Only the first register is recorded; a second word takes the register
+  // handed out next.
+  State->setFirstByValReg(State->AllocateReg(GPR64ArgRegs64Bit, NumArgRegs));
+  if (RegsRequired == 2)
+    State->AllocateReg(GPR64ArgRegs64Bit, NumArgRegs);
+}
+
 /// MatchingStackOffset - Return true if the given stack call argument is
 /// already available in the same position (relatively) of the caller's
 /// incoming argument stack.