AMDGPUPromoteAlloca: give up on an alloca when one of its addrspacecast users
may be captured (PointerMayBeCaptured on the cast), and add a regression test
that expects the alloca, the addrspacecast and the ptrtoint to be left as-is.

Index: lib/Target/AMDGPU/AMDGPUPromoteAlloca.cpp
===================================================================
--- lib/Target/AMDGPU/AMDGPUPromoteAlloca.cpp
+++ lib/Target/AMDGPU/AMDGPUPromoteAlloca.cpp
@@ -21,6 +21,7 @@
 #include "llvm/ADT/StringRef.h"
 #include "llvm/ADT/Triple.h"
 #include "llvm/ADT/Twine.h"
+#include "llvm/Analysis/CaptureTracking.h"
 #include "llvm/Analysis/ValueTracking.h"
 #include "llvm/IR/Attributes.h"
 #include "llvm/IR/BasicBlock.h"
@@ -608,6 +609,9 @@
     }
 
     if (UseInst->getOpcode() == Instruction::AddrSpaceCast) {
+      // Give up if the pointer may be captured.
+      if (PointerMayBeCaptured(UseInst, true, true))
+        return false;
       // Don't collect the users of this.
       WorkList.push_back(User);
       continue;
Index: test/CodeGen/AMDGPU/addrspacecast-captured.ll
===================================================================
--- /dev/null
+++ test/CodeGen/AMDGPU/addrspacecast-captured.ll
@@ -0,0 +1,19 @@
+; RUN: opt -S -mtriple=amdgcn-unknown-amdhsa -mcpu=kaveri -amdgpu-promote-alloca < %s | FileCheck %s
+
+; Nothing should be done if the addrspacecast is captured.
+
+; CHECK-LABEL: @addrspacecast_captured(
+; CHECK: %data = alloca i32, align 4
+; CHECK: %tmp = addrspacecast i32* %data to i32 addrspace(4)*
+; CHECK: %0 = ptrtoint i32 addrspace(4)* %tmp to i32
+; CHECK: store i32 %0, i32 addrspace(1)* %out
+define void @addrspacecast_captured(i32 addrspace(1)* %out) #0 {
+entry:
+  %data = alloca i32, align 4
+  %tmp = addrspacecast i32* %data to i32 addrspace(4)*
+  %0 = ptrtoint i32 addrspace(4)* %tmp to i32
+  store i32 %0, i32 addrspace(1)* %out
+  ret void
+}
+
+attributes #0 = { nounwind }