; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck -check-prefix=SI %s

; Both intrinsics take and return i32 and are declared nounwind/readnone (see
; attribute group #0 at the end of the file). The kernel below chains them to
; form a per-lane index, which it names %tid.
declare i32 @llvm.amdgcn.mbcnt.lo(i32, i32) #0
declare i32 @llvm.amdgcn.mbcnt.hi(i32, i32) #0

; Address calculation for indexing a pointer to [1025 x i32] by a per-lane
; index. Each array element is 1025 * 4 = 4100 bytes, so the byte offset of
; element %tid is a multiply by a non-power-of-two constant. The checks below
; require that multiply to be emitted as the 24-bit forms (low and high
; halves, in either order).
; NOTE(review): the 24-bit forms are presumably legal because the mbcnt result
; is known to be small; confirm against the backend before relying on this.
; SI-LABEL: {{^}}test_array_ptr_calc:
; SI-DAG: v_mul_u32_u24
; SI-DAG: v_mul_hi_u32_u24
; SI: s_endpgm
define amdgpu_kernel void @test_array_ptr_calc(i32 addrspace(1)* noalias %out, [1025 x i32] addrspace(1)* noalias %inA, i32 addrspace(1)* noalias %inB) {
  ; %tid = mbcnt.hi(-1, mbcnt.lo(-1, 0)): the low-half count is fed in as the
  ; accumulator operand of the high-half count.
  %mbcnt.lo = call i32 @llvm.amdgcn.mbcnt.lo(i32 -1, i32 0)
  %tid = call i32 @llvm.amdgcn.mbcnt.hi(i32 -1, i32 %mbcnt.lo)

  ; %a_ptr addresses the first i32 of the %tid-th [1025 x i32] array in %inA;
  ; this is the GEP whose scaling the checks above are about.
  %a_ptr = getelementptr [1025 x i32], [1025 x i32] addrspace(1)* %inA, i32 %tid, i32 0
  ; %b_ptr addresses the %tid-th i32 in %inB (plain 4-byte stride).
  %b_ptr = getelementptr i32, i32 addrspace(1)* %inB, i32 %tid

  ; Load both values and store their sum so neither address computation is
  ; dead.
  %a = load i32, i32 addrspace(1)* %a_ptr
  %b = load i32, i32 addrspace(1)* %b_ptr
  %result = add i32 %a, %b
  store i32 %result, i32 addrspace(1)* %out
  ret void
}

attributes #0 = { nounwind readnone }