AMDGPU: Switch barrier intrinsics to using convergent

noduplicate prevents unrolling of small loops that happen to contain
barriers. If a loop has a barrier in it, it is OK to duplicate the
barrier as part of the unroll.

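A minimal sketch of the kind of loop this affects (hypothetical kernel
and trip count, not taken from this patch): with the callee marked
noduplicate, the unroller could not duplicate the barrier call, so the
loop stayed rolled; with convergent, full unrolling may copy the barrier
into each unrolled iteration, which is legal since unrolling introduces
no new control dependence on the call.

  ; Hypothetical example for illustration only.
  declare void @llvm.AMDGPU.barrier.local() nounwind convergent

  define void @small_loop(i32 addrspace(3)* %lds) {
  entry:
    br label %loop

  loop:                ; trip count 2; full unrolling duplicates the body
    %i = phi i32 [ 0, %entry ], [ %i.next, %loop ]
    %ptr = getelementptr i32, i32 addrspace(3)* %lds, i32 %i
    store i32 %i, i32 addrspace(3)* %ptr, align 4
    ; With convergent, this call may be duplicated with the loop body.
    call void @llvm.AMDGPU.barrier.local() nounwind convergent
    %i.next = add i32 %i, 1
    %done = icmp eq i32 %i.next, 2
    br i1 %done, label %exit, label %loop

  exit:
    ret void
  }
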
llvm-svn: 256075
diff --git a/llvm/test/CodeGen/AMDGPU/array-ptr-calc-i32.ll b/llvm/test/CodeGen/AMDGPU/array-ptr-calc-i32.ll
index 67738f7..f8a7422 100644
--- a/llvm/test/CodeGen/AMDGPU/array-ptr-calc-i32.ll
+++ b/llvm/test/CodeGen/AMDGPU/array-ptr-calc-i32.ll
@@ -2,7 +2,7 @@
 ; RUN: llc -verify-machineinstrs -march=amdgcn -mcpu=SI -mattr=+promote-alloca < %s | FileCheck -check-prefix=SI-PROMOTE -check-prefix=SI %s
 
 declare i32 @llvm.SI.tid() nounwind readnone
-declare void @llvm.AMDGPU.barrier.local() nounwind noduplicate
+declare void @llvm.AMDGPU.barrier.local() nounwind convergent
 
 ; The required pointer calculations for the alloca'd actually requires
 ; an add and won't be folded into the addressing, which fails with a
@@ -35,7 +35,7 @@
   %alloca_ptr = getelementptr [4 x i32], [4 x i32]* %alloca, i32 1, i32 %b
   store i32 %result, i32* %alloca_ptr, align 4
   ; Dummy call
-  call void @llvm.AMDGPU.barrier.local() nounwind noduplicate
+  call void @llvm.AMDGPU.barrier.local() nounwind convergent
   %reload = load i32, i32* %alloca_ptr, align 4
   %out_ptr = getelementptr i32, i32 addrspace(1)* %out, i32 %tid
   store i32 %reload, i32 addrspace(1)* %out_ptr, align 4