From 9e0fd27ce7cd1a7b1a316760de7cf4795799af26 Mon Sep 17 00:00:00 2001 From: Hao Liu Date: Wed, 8 Jan 2014 03:06:15 +0000 Subject: [PATCH] Fix a bug about generating undef operand when optimising shuffle vector and insert element in instruction combine. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@198730 91177308-0d34-0410-b5e6-96231b3b80d8 --- .../InstCombine/InstCombineVectorOps.cpp | 5 +++-- test/Transforms/InstCombine/vec_shuffle.ll | 17 +++++++++++++++++ 2 files changed, 20 insertions(+), 2 deletions(-) diff --git a/lib/Transforms/InstCombine/InstCombineVectorOps.cpp b/lib/Transforms/InstCombine/InstCombineVectorOps.cpp index 1e724106991..c0b9b2fc3e5 100644 --- a/lib/Transforms/InstCombine/InstCombineVectorOps.cpp +++ b/lib/Transforms/InstCombine/InstCombineVectorOps.cpp @@ -763,9 +763,10 @@ InstCombiner::EvaluateInDifferentElementOrder(Value *V, ArrayRef<int> Mask) { } } + // If element is not in Mask, no need to handle the operand 1 (element to + // be inserted). Just evaluate values in operand 0 according to Mask. 
if (!Found) - return UndefValue::get( - VectorType::get(V->getType()->getScalarType(), Mask.size())); + return EvaluateInDifferentElementOrder(I->getOperand(0), Mask); Value *V = EvaluateInDifferentElementOrder(I->getOperand(0), Mask); return InsertElementInst::Create(V, I->getOperand(1), diff --git a/test/Transforms/InstCombine/vec_shuffle.ll b/test/Transforms/InstCombine/vec_shuffle.ll index 3ee43dc63a6..a409a911ef1 100644 --- a/test/Transforms/InstCombine/vec_shuffle.ll +++ b/test/Transforms/InstCombine/vec_shuffle.ll @@ -228,3 +228,20 @@ define <4 x float> @test15b(<4 x float> %LHS, <4 x float> %RHS) { ret <4 x float> %tmp5 } +define <1 x i32> @test16a(i32 %ele) { +; CHECK-LABEL: @test16a( +; CHECK-NEXT: ret <1 x i32> <i32 2> + %tmp0 = insertelement <2 x i32> <i32 1, i32 undef>, i32 %ele, i32 1 + %tmp1 = shl <2 x i32> %tmp0, <i32 1, i32 1> + %tmp2 = shufflevector <2 x i32> %tmp1, <2 x i32> undef, <1 x i32> <i32 0> + ret <1 x i32> %tmp2 +} + +define <4 x i8> @test16b(i8 %ele) { +; CHECK-LABEL: @test16b( +; CHECK-NEXT: ret <4 x i8> <i8 2, i8 2, i8 2, i8 2> + %tmp0 = insertelement <8 x i8> <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 undef, i8 1>, i8 %ele, i32 6 + %tmp1 = shl <8 x i8> %tmp0, <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1> + %tmp2 = shufflevector <8 x i8> %tmp1, <8 x i8> undef, <4 x i32> <i32 1, i32 2, i32 3, i32 4> + ret <4 x i8> %tmp2 +} \ No newline at end of file -- 2.34.1