[AVX] Implement 256-bit vector lowering for INSERT_VECTOR_ELT.

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@125187 91177308-0d34-0410-b5e6-96231b3b80d8
author: David Greene <greened@obbligato.org> 2011-02-09 15:32:06 +0000
committer: David Greene <greened@obbligato.org> 2011-02-09 15:32:06 +0000
commit: 6b38126da3dcc924b37715c70fa8abde69e02634 (patch)
tree: 202cd0fdbf07401a6e5236a0d1335978069f1d04 /lib
parent: 59982f3ffcc853a2c66ef674c601ee61dbe205a5 (diff)
download: llvm-6b38126da3dcc924b37715c70fa8abde69e02634.tar.gz
llvm-6b38126da3dcc924b37715c70fa8abde69e02634.tar.bz2
llvm-6b38126da3dcc924b37715c70fa8abde69e02634.tar.xz
1 files changed, 36 insertions, 6 deletions
diff --git a/lib/Target/X86/X86ISelLowering.cpp b/lib/Target/X86/X86ISelLowering.cpp
index b7599f097f..ea7eef7320 100644
--- a/lib/Target/X86/X86ISelLowering.cpp
+++ b/lib/Target/X86/X86ISelLowering.cpp
@@ -125,7 +125,9 @@ static SDValue Extract128BitVector(SDValue Vec,
 
 /// Generate a DAG to put 128-bits into a vector > 128 bits.  This
 /// sets things up to match to an AVX VINSERTF128 instruction or a
-/// simple superregister reference.
+/// simple superregister reference.  Idx is an index in the 128 bits
+/// we want.  It need not be aligned to a 128-bit bounday.  That makes
+/// lowering INSERT_VECTOR_ELT operations easier.
 static SDValue Insert128BitVector(SDValue Result,
                                   SDValue Vec,
                                   SDValue Idx,
@@ -6027,17 +6029,45 @@ X86TargetLowering::LowerINSERT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const {
   EVT VT = Op.getValueType();
   EVT EltVT = VT.getVectorElementType();
 
+  DebugLoc dl = Op.getDebugLoc();
+  SDValue N0 = Op.getOperand(0);
+  SDValue N1 = Op.getOperand(1);
+  SDValue N2 = Op.getOperand(2);
+
+  // If this is a 256-bit vector result, first insert into a 128-bit
+  // vector and then insert into the 256-bit vector.
+  if (VT.getSizeInBits() > 128) {
+    if (!isa<ConstantSDNode>(N2))
+      return SDValue();
+
+    // Get the 128-bit vector.
+    unsigned NumElems = VT.getVectorNumElements();
+    unsigned IdxVal = cast<ConstantSDNode>(N2)->getZExtValue();
+    bool Upper = IdxVal >= NumElems / 2;
+
+    SDValue SubN0 = Extract128BitVector(N0, N2, DAG, dl);
+
+    // Insert into it.
+    SDValue ScaledN2 = N2;
+    if (Upper)
+      ScaledN2 = DAG.getNode(ISD::SUB, dl, N2.getValueType(), N2,
+                             DAG.getConstant(NumElems / 
+                                             (VT.getSizeInBits() / 128),
+                                             N2.getValueType()));
+    Op = DAG.getNode(ISD::INSERT_VECTOR_ELT, dl, SubN0.getValueType(), SubN0,
+                     N1, ScaledN2);
+
+    // Insert the 128-bit vector
+    // FIXME: Why UNDEF?
+    return Insert128BitVector(N0, Op, N2, DAG, dl);
+  }
+
   if (Subtarget->hasSSE41())
     return LowerINSERT_VECTOR_ELT_SSE4(Op, DAG);
 
   if (EltVT == MVT::i8)
     return SDValue();
 
-  DebugLoc dl = Op.getDebugLoc();
-  SDValue N0 = Op.getOperand(0);
-  SDValue N1 = Op.getOperand(1);
-  SDValue N2 = Op.getOperand(2);
-
   if (EltVT.getSizeInBits() == 16 && isa<ConstantSDNode>(N2)) {
     // Transform it so it match pinsrw which expects a 16-bit value in a GR32
     // as its second argument.
author	David Greene <greened@obbligato.org>	2011-02-09 15:32:06 +0000
committer	David Greene <greened@obbligato.org>	2011-02-09 15:32:06 +0000
commit	6b38126da3dcc924b37715c70fa8abde69e02634 (patch)
tree	202cd0fdbf07401a6e5236a0d1335978069f1d04 /lib
parent	59982f3ffcc853a2c66ef674c601ee61dbe205a5 (diff)
download	llvm-6b38126da3dcc924b37715c70fa8abde69e02634.tar.gz llvm-6b38126da3dcc924b37715c70fa8abde69e02634.tar.bz2 llvm-6b38126da3dcc924b37715c70fa8abde69e02634.tar.xz