Handle Neon v2f64 and v2i64 vector shuffles as register copies.
This fixes the remaining issue with pr7167. llvm-svn: 104257
This commit is contained in:
parent
63d4f68df4
commit
5954994bba
|
|
@ -3022,6 +3022,24 @@ static SDValue LowerVECTOR_SHUFFLE(SDValue Op, SelectionDAG &DAG) {
|
||||||
return GeneratePerfectShuffle(PFEntry, V1, V2, DAG, dl);
|
return GeneratePerfectShuffle(PFEntry, V1, V2, DAG, dl);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// v2f64 and v2i64 shuffles are just register copies.
|
||||||
|
if (VT == MVT::v2f64 || VT == MVT::v2i64) {
|
||||||
|
// Do the expansion as f64 since i64 is not legal.
|
||||||
|
V1 = DAG.getNode(ISD::BIT_CONVERT, dl, MVT::v2f64, V1);
|
||||||
|
V2 = DAG.getNode(ISD::BIT_CONVERT, dl, MVT::v2f64, V2);
|
||||||
|
SDValue Val = DAG.getUNDEF(MVT::v2f64);
|
||||||
|
for (unsigned i = 0; i < 2; ++i) {
|
||||||
|
if (ShuffleMask[i] < 0)
|
||||||
|
continue;
|
||||||
|
SDValue Elt = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, MVT::f64,
|
||||||
|
ShuffleMask[i] < 2 ? V1 : V2,
|
||||||
|
DAG.getConstant(ShuffleMask[i] & 1, MVT::i32));
|
||||||
|
Val = DAG.getNode(ISD::INSERT_VECTOR_ELT, dl, MVT::v2f64, Val,
|
||||||
|
Elt, DAG.getConstant(i, MVT::i32));
|
||||||
|
}
|
||||||
|
return DAG.getNode(ISD::BIT_CONVERT, dl, VT, Val);
|
||||||
|
}
|
||||||
|
|
||||||
return SDValue();
|
return SDValue();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@ -12,3 +12,10 @@ define <8 x i8> @f2(<8 x i8> %x) nounwind {
|
||||||
<8 x i32> <i32 1, i32 2, i32 0, i32 5, i32 3, i32 6, i32 7, i32 4>
|
<8 x i32> <i32 1, i32 2, i32 0, i32 5, i32 3, i32 6, i32 7, i32 4>
|
||||||
ret <8 x i8> %y
|
ret <8 x i8> %y
|
||||||
}
|
}
|
||||||
|
|
||||||
|
define void @f3(<4 x i64>* %xp) nounwind {
|
||||||
|
%x = load <4 x i64>* %xp
|
||||||
|
%y = shufflevector <4 x i64> %x, <4 x i64> undef, <4 x i32> <i32 0, i32 3, i32 2, i32 1>
|
||||||
|
store <4 x i64> %y, <4 x i64>* %xp
|
||||||
|
ret void
|
||||||
|
}
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue