; RUN: llc < %s -march=amdgcn -verify-machineinstrs | FileCheck %s

; This tests that the llvm.SI.end.cf intrinsic is not inserted into the
; loop block. This intrinsic will be lowered to s_or_b64 by the code
; generator.

; CHECK-LABEL: {{^}}test:

; This was lowered from the llvm.SI.end.cf intrinsic:
; CHECK: s_or_b64 exec, exec

; CHECK: [[LOOP_LABEL:[0-9A-Za-z_]+]]: ; %loop{{$}}
; CHECK-NOT: s_or_b64 exec, exec
; CHECK: s_cbranch_execnz [[LOOP_LABEL]]
; Kernel under test.
;
; Control flow: entry -> (if ->) loop -> done. The branch in `entry` depends on
; the value returned by llvm.amdgcn.workitem.id.x, and `loop` is reachable both
; directly from `entry` and through `if`.
;
; The block name `loop` must be kept: the FileCheck directives in this file
; match the "; %loop" block comment in llc's output.
define amdgpu_kernel void @test(i32 addrspace(1)* %out) {
entry:
  ; Branch on whether the work-item id is zero.
  %cond = call i32 @llvm.amdgcn.workitem.id.x() #0
  %tmp0 = icmp eq i32 %cond, 0
  br i1 %tmp0, label %if, label %loop

if:
  ; Only taken when %cond == 0; writes out[0] and then joins the loop.
  store i32 0, i32 addrspace(1)* %out
  br label %loop

loop:
  ; Running sum starts at 0 on both entry edges and grows by %cond on each
  ; iteration; the loop exits once the sum is (unsigned) greater than 10.
  ; NOTE(review): when %cond is 0 the sum never changes, so the exit condition
  ; is never true for that work-item. The test only inspects llc's output, so
  ; this presumably does not matter -- confirm before reusing this IR elsewhere.
  %tmp1 = phi i32 [0, %entry], [0, %if], [%inc, %loop]
  %inc = add i32 %tmp1, %cond
  %tmp2 = icmp ugt i32 %inc, 10
  br i1 %tmp2, label %done, label %loop

done:
  ; Store the final sum to out[1].
  %tmp3 = getelementptr i32, i32 addrspace(1)* %out, i64 1
  store i32 %inc, i32 addrspace(1)* %tmp3
  ret void
}

; Declaration of the intrinsic that @test calls to obtain %cond. Both the
; declaration and the call site use attribute group #0.
declare i32 @llvm.amdgcn.workitem.id.x() #0

attributes #0 = { nounwind readnone }