AMDGPU: Fix AMDGPUPromoteAlloca breaking addrspacecasts
author Matt Arsenault <Matthew.Arsenault@amd.com>
Sat, 10 Dec 2016 00:52:50 +0000 (00:52 +0000)
committer Matt Arsenault <Matthew.Arsenault@amd.com>
Sat, 10 Dec 2016 00:52:50 +0000 (00:52 +0000)
The users of the addrspacecast were having their types incorrectly
changed, producing invalid bitcasts between address spaces.

llvm-svn: 289307

llvm/lib/Target/AMDGPU/AMDGPUPromoteAlloca.cpp
llvm/test/CodeGen/AMDGPU/promote-alloca-addrspacecast.ll [new file with mode: 0644]

index 296a8aa..baa28de 100644 (file)
@@ -579,6 +579,12 @@ bool AMDGPUPromoteAlloca::collectUsesWithPtrTypes(
       WorkList.push_back(ICmp);
     }
 
+    if (UseInst->getOpcode() == Instruction::AddrSpaceCast) {
+      // Don't collect the users of this.
+      WorkList.push_back(User);
+      continue;
+    }
+
     if (!User->getType()->isPointerTy())
       continue;
 
@@ -739,7 +745,8 @@ void AMDGPUPromoteAlloca::handleAlloca(AllocaInst &I) {
         continue;
       }
 
-      // The operand's value should be corrected on its own.
+      // The operand's value should be corrected on its own and we don't want to
+      // touch the users.
       if (isa<AddrSpaceCastInst>(V))
         continue;
 
diff --git a/llvm/test/CodeGen/AMDGPU/promote-alloca-addrspacecast.ll b/llvm/test/CodeGen/AMDGPU/promote-alloca-addrspacecast.ll
new file mode 100644 (file)
index 0000000..f00b3de
--- /dev/null
@@ -0,0 +1,21 @@
+; RUN: opt -S -mtriple=amdgcn-unknown-amdhsa -mcpu=kaveri -amdgpu-promote-alloca < %s | FileCheck %s
+
+; The types of the users of the addrspacecast should not be changed.
+
+; CHECK-LABEL: @invalid_bitcast_addrspace(
+; CHECK: getelementptr inbounds [256 x [1 x i32]], [256 x [1 x i32]] addrspace(3)* @invalid_bitcast_addrspace.data, i32 0, i32 %14
+; CHECK: bitcast [1 x i32] addrspace(3)* %{{[0-9]+}} to half addrspace(3)*
+; CHECK: addrspacecast half addrspace(3)* %tmp to half addrspace(4)*
+; CHECK: bitcast half addrspace(4)* %tmp1 to <2 x i16> addrspace(4)*
+define amdgpu_kernel void @invalid_bitcast_addrspace() #0 { ; regression kernel: alloca -> bitcast -> addrspacecast -> bitcast -> load
+entry:
+  %data = alloca [1 x i32], align 4 ; the checks above expect this to be replaced by the addrspace(3) global @invalid_bitcast_addrspace.data
+  %tmp = bitcast [1 x i32]* %data to half* ; direct user of the alloca; expected to be retyped to addrspace(3)
+  %tmp1 = addrspacecast half* %tmp to half addrspace(4)* ; operand becomes addrspace(3), result is expected to stay addrspace(4)
+  %tmp2 = bitcast half addrspace(4)* %tmp1 to <2 x i16> addrspace(4)* ; user of the addrspacecast; its types must be left untouched
+  %tmp3 = load <2 x i16>, <2 x i16> addrspace(4)* %tmp2, align 2 ; load through the addrspace(4) pointer
+  %tmp4 = bitcast <2 x i16> %tmp3 to <2 x half> ; result is unused
+  ret void
+}
+
+attributes #0 = { nounwind }