From 01494c6a7318395f577f41bd57b4bf8ca2591309 Mon Sep 17 00:00:00 2001 From: Simon Pilgrim Date: Thu, 13 Jan 2022 15:25:13 +0000 Subject: [PATCH] [X86] Add tests showing failure to merge shuffles through avx2 shift binops --- llvm/test/CodeGen/X86/combine-avx2-intrinsics.ll | 49 ++++++++++++++++++++++++ 1 file changed, 49 insertions(+) diff --git a/llvm/test/CodeGen/X86/combine-avx2-intrinsics.ll b/llvm/test/CodeGen/X86/combine-avx2-intrinsics.ll index 1128411..8562f80 100644 --- a/llvm/test/CodeGen/X86/combine-avx2-intrinsics.ll +++ b/llvm/test/CodeGen/X86/combine-avx2-intrinsics.ll @@ -122,6 +122,55 @@ define <4 x i64> @demandedelts_vpsrlvq(<4 x i64> %a0, <4 x i64> %a1) { ret <4 x i64> %result } +; +; isBinOp Handling (TODO) +; + +define <4 x i32> @binop_shuffle_vpsllvd(<4 x i32> %a0, <4 x i32> %a1) { +; CHECK-LABEL: binop_shuffle_vpsllvd: +; CHECK: # %bb.0: +; CHECK-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[3,2,1,0] +; CHECK-NEXT: vpshufd {{.*#+}} xmm1 = xmm1[3,2,1,0] +; CHECK-NEXT: vpsllvd %xmm1, %xmm0, %xmm0 +; CHECK-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[3,2,1,0] +; CHECK-NEXT: retq + %shuffle0 = shufflevector <4 x i32> %a0, <4 x i32> undef, <4 x i32> + %shuffle1 = shufflevector <4 x i32> %a1, <4 x i32> undef, <4 x i32> + %shift = call <4 x i32> @llvm.x86.avx2.psllv.d(<4 x i32> %shuffle0, <4 x i32> %shuffle1) + %res = shufflevector <4 x i32> %shift, <4 x i32> undef, <4 x i32> + ret <4 x i32> %res +} + +define <8 x i32> @binop_shuffle_vpsravd(<8 x i32> %a0, <8 x i32> %a1) { +; CHECK-LABEL: binop_shuffle_vpsravd: +; CHECK: # %bb.0: +; CHECK-NEXT: vpshufd {{.*#+}} ymm0 = ymm0[3,2,1,0,7,6,5,4] +; CHECK-NEXT: vpshufd {{.*#+}} ymm1 = ymm1[3,2,1,0,7,6,5,4] +; CHECK-NEXT: vpsravd %ymm1, %ymm0, %ymm0 +; CHECK-NEXT: vpshufd {{.*#+}} ymm0 = ymm0[3,2,1,0,7,6,5,4] +; CHECK-NEXT: retq + %shuffle0 = shufflevector <8 x i32> %a0, <8 x i32> undef, <8 x i32> + %shuffle1 = shufflevector <8 x i32> %a1, <8 x i32> undef, <8 x i32> + %shift = call <8 x i32> @llvm.x86.avx2.psrav.d.256(<8 x i32> %shuffle0, <8 x i32> %shuffle1) + %res = shufflevector <8 x i32> %shift, <8 x i32> undef, <8 x i32> + ret <8 x i32> %res +} + +define <4 x i64> @binop_shuffle_vpsrlvq(<4 x i64> %a0, <4 x i64> %a1) { +; CHECK-LABEL: binop_shuffle_vpsrlvq: +; CHECK: # %bb.0: +; CHECK-NEXT: vpermq {{.*#+}} ymm0 = ymm0[3,2,1,0] +; CHECK-NEXT: vpermq {{.*#+}} ymm1 = ymm1[3,2,1,0] +; CHECK-NEXT: vpsrlvq %ymm1, %ymm0, %ymm0 +; CHECK-NEXT: vpermq {{.*#+}} ymm0 = ymm0[3,2,1,0] +; CHECK-NEXT: retq + %shuffle0 = shufflevector <4 x i64> %a0, <4 x i64> undef, <4 x i32> + %shuffle1 = shufflevector <4 x i64> %a1, <4 x i64> undef, <4 x i32> + %shift = call <4 x i64> @llvm.x86.avx2.psrlv.q.256(<4 x i64> %shuffle0, <4 x i64> %shuffle1) + %res = shufflevector <4 x i64> %shift, <4 x i64> undef, <4 x i32> + ret <4 x i64> %res +} + declare <16 x i16> @llvm.x86.avx2.pblendw(<16 x i16>, <16 x i16>, i32) declare <4 x i32> @llvm.x86.avx2.pblendd.128(<4 x i32>, <4 x i32>, i32) declare <8 x i32> @llvm.x86.avx2.pblendd.256(<8 x i32>, <8 x i32>, i32) -- 2.7.4