From: Sanjay Patel Date: Thu, 10 Nov 2016 00:15:14 +0000 (+0000) Subject: [InstCombine] avoid infinite loop from shuffle-extract-insert sequence (PR30923) X-Git-Tag: llvmorg-4.0.0-rc1~5070 X-Git-Url: http://review.tizen.org/git/?a=commitdiff_plain;h=4e1b5a53c728ea48460c7ca8c8ac28e9bef92334;p=platform%2Fupstream%2Fllvm.git [InstCombine] avoid infinite loop from shuffle-extract-insert sequence (PR30923) Removing the limitation in visitInsertElementInst() causes several regressions because we're not prepared to fold sequences of shuffles or inserts and extracts separated by shuffles. Fixing that appears to be a difficult mission because we are purposely trying to avoid creating shuffles with arbitrary shuffle masks because some targets may choke on those. https://llvm.org/bugs/show_bug.cgi?id=30923 llvm-svn: 286423 --- diff --git a/llvm/lib/Transforms/InstCombine/InstCombineVectorOps.cpp b/llvm/lib/Transforms/InstCombine/InstCombineVectorOps.cpp index 6c3aa3a..732a786 100644 --- a/llvm/lib/Transforms/InstCombine/InstCombineVectorOps.cpp +++ b/llvm/lib/Transforms/InstCombine/InstCombineVectorOps.cpp @@ -413,6 +413,14 @@ static void replaceExtractElements(InsertElementInst *InsElt, if (InsertionBlock != InsElt->getParent()) return; + // TODO: This restriction matches the check in visitInsertElementInst() and + // prevents an infinite loop caused by not turning the extract/insert pair + // into a shuffle. We really should not need either check, but we're lacking + // folds for shufflevectors because we're afraid to generate shuffle masks + // that the backend can't handle. + if (InsElt->hasOneUse() && isa(InsElt->user_back())) + return; + auto *WideVec = new ShuffleVectorInst(ExtVecOp, UndefValue::get(ExtVecType), ConstantVector::get(ExtendMask)); diff --git a/llvm/test/Transforms/InstCombine/insert-extract-shuffle.ll b/llvm/test/Transforms/InstCombine/insert-extract-shuffle.ll index 163c336..4507deb 100644 --- a/llvm/test/Transforms/InstCombine/insert-extract-shuffle.ll +++ b/llvm/test/Transforms/InstCombine/insert-extract-shuffle.ll @@ -237,3 +237,30 @@ end: ret double %mu } +; https://llvm.org/bugs/show_bug.cgi?id=30923 +; Delete the widening shuffle if we're not going to reduce the extract/insert to a shuffle. + +define <4 x float> @PR30923(<2 x float> %x) { +; CHECK-LABEL: @PR30923( +; CHECK-NEXT: bb1: +; CHECK-NEXT: [[EXT1:%.*]] = extractelement <2 x float> %x, i32 1 +; CHECK-NEXT: store float [[EXT1]], float* undef, align 4 +; CHECK-NEXT: br label %bb2 +; CHECK: bb2: +; CHECK-NEXT: [[EXT2:%.*]] = extractelement <2 x float> %x, i32 0 +; CHECK-NEXT: [[INS1:%.*]] = insertelement <4 x float> , float [[EXT2]], i32 2 +; CHECK-NEXT: [[INS2:%.*]] = insertelement <4 x float> [[INS1]], float [[EXT1]], i32 3 +; CHECK-NEXT: ret <4 x float> [[INS2]] +; +bb1: + %ext1 = extractelement <2 x float> %x, i32 1 + store float %ext1, float* undef, align 4 + br label %bb2 + +bb2: + %widen = shufflevector <2 x float> %x, <2 x float> undef, <4 x i32> + %ext2 = extractelement <4 x float> %widen, i32 0 + %ins1 = insertelement <4 x float> , float %ext2, i32 2 + %ins2 = insertelement <4 x float> %ins1, float %ext1, i32 3 + ret <4 x float> %ins2 +}