Tom Stellard | e88bbc3 | 2016-09-23 01:33:26 +0000 | [diff] [blame] | 1 | ; RUN: llc -mtriple=amdgcn--amdhsa -mcpu=kaveri -verify-machineinstrs < %s | FileCheck -check-prefixes=CO-V2,HSA,ALL,HSA-NOENV %s |
| 2 | ; RUN: llc -mtriple=amdgcn--amdhsa-opencl -mcpu=kaveri -verify-machineinstrs < %s | FileCheck -check-prefixes=CO-V2,HSA,ALL,HSA-OPENCL %s |
Tom Stellard | 0b76fc4c | 2016-09-16 21:34:26 +0000 | [diff] [blame] | 3 | ; RUN: llc -mtriple=amdgcn-mesa-mesa3d -verify-machineinstrs < %s | FileCheck -check-prefixes=CO-V2,OS-MESA3D,MESA,ALL %s |
| 4 | ; RUN: llc -mtriple=amdgcn-mesa-unknown -verify-machineinstrs < %s | FileCheck -check-prefixes=OS-UNKNOWN,MESA,ALL %s |
Yaxun Liu | a618acf | 2017-06-01 21:31:53 +0000 | [diff] [blame] | 5 | ; RUN: llc -mtriple=amdgcn--amdhsa-amdgiz -mcpu=kaveri -verify-machineinstrs < %s | FileCheck -check-prefixes=CO-V2,HSA,ALL,HSA-NOENV %s |
| 6 | ; RUN: llc -mtriple=amdgcn--amdhsa-amdgizcl -mcpu=kaveri -verify-machineinstrs < %s | FileCheck -check-prefixes=CO-V2,HSA,ALL,HSA-OPENCL %s |
Matt Arsenault | dc4ebad | 2016-04-29 21:16:52 +0000 | [diff] [blame] | 7 | |
| 8 | ; ALL-LABEL: {{^}}test: |
Tom Stellard | 0b76fc4c | 2016-09-16 21:34:26 +0000 | [diff] [blame] | 9 | ; CO-V2: enable_sgpr_kernarg_segment_ptr = 1 |
| 10 | ; CO-V2: s_load_dword s{{[0-9]+}}, s[4:5], 0xa |
Matt Arsenault | dc4ebad | 2016-04-29 21:16:52 +0000 | [diff] [blame] | 11 | |
Tom Stellard | 0b76fc4c | 2016-09-16 21:34:26 +0000 | [diff] [blame] | 12 | ; OS-UNKNOWN: s_load_dword s{{[0-9]+}}, s[0:1], 0xa |
Matt Arsenault | 3dbeefa | 2017-03-21 21:39:51 +0000 | [diff] [blame] | 13 | define amdgpu_kernel void @test(i32 addrspace(1)* %out) #1 { |
Yaxun Liu | 0124b54 | 2018-02-13 18:00:25 +0000 | [diff] [blame] | 14 | %kernarg.segment.ptr = call noalias i8 addrspace(4)* @llvm.amdgcn.kernarg.segment.ptr() |
| 15 | %header.ptr = bitcast i8 addrspace(4)* %kernarg.segment.ptr to i32 addrspace(4)* |
| 16 | %gep = getelementptr i32, i32 addrspace(4)* %header.ptr, i64 10 |
| 17 | %value = load i32, i32 addrspace(4)* %gep |
Matt Arsenault | dc4ebad | 2016-04-29 21:16:52 +0000 | [diff] [blame] | 18 | store i32 %value, i32 addrspace(1)* %out |
| 19 | ret void |
| 20 | } |
| 21 | |
Jan Vesely | fea814d | 2016-06-21 20:46:20 +0000 | [diff] [blame] | 22 | ; ALL-LABEL: {{^}}test_implicit: |
| 23 | ; 10 + 9 (36 prepended implicit bytes) + 2(out pointer) = 21 = 0x15 |
Tom Stellard | 0b76fc4c | 2016-09-16 21:34:26 +0000 | [diff] [blame] | 24 | ; OS-UNKNOWN: s_load_dword s{{[0-9]+}}, s[0:1], 0x15 |
Matt Arsenault | 3dbeefa | 2017-03-21 21:39:51 +0000 | [diff] [blame] | 25 | define amdgpu_kernel void @test_implicit(i32 addrspace(1)* %out) #1 { |
Yaxun Liu | 0124b54 | 2018-02-13 18:00:25 +0000 | [diff] [blame] | 26 | %implicitarg.ptr = call noalias i8 addrspace(4)* @llvm.amdgcn.implicitarg.ptr() |
| 27 | %header.ptr = bitcast i8 addrspace(4)* %implicitarg.ptr to i32 addrspace(4)* |
| 28 | %gep = getelementptr i32, i32 addrspace(4)* %header.ptr, i64 10 |
| 29 | %value = load i32, i32 addrspace(4)* %gep |
Jan Vesely | fea814d | 2016-06-21 20:46:20 +0000 | [diff] [blame] | 30 | store i32 %value, i32 addrspace(1)* %out |
| 31 | ret void |
| 32 | } |
| 33 | |
Tom Stellard | ba57308 | 2016-08-31 18:46:07 +0000 | [diff] [blame] | 34 | ; ALL-LABEL: {{^}}test_implicit_alignment |
Tom Stellard | e88bbc3 | 2016-09-23 01:33:26 +0000 | [diff] [blame] | 35 | ; HSA-NOENV: kernarg_segment_byte_size = 10 |
| 36 | ; HSA-OPENCL: kernarg_segment_byte_size = 48 |
| 37 | ; OS-MESA3D: kernarg_segment_byte_size = 28 |
Tom Stellard | 0b76fc4c | 2016-09-16 21:34:26 +0000 | [diff] [blame] | 38 | ; OS-UNKNOWN: s_load_dword [[VAL:s[0-9]+]], s[{{[0-9]+:[0-9]+}}], 0xc |
Tom Stellard | b2869eb | 2016-09-09 19:28:00 +0000 | [diff] [blame] | 39 | ; HSA: s_load_dword [[VAL:s[0-9]+]], s[{{[0-9]+:[0-9]+}}], 0x4 |
Tom Stellard | 0b76fc4c | 2016-09-16 21:34:26 +0000 | [diff] [blame] | 40 | ; OS-MESA3D: s_load_dword [[VAL:s[0-9]+]], s[{{[0-9]+:[0-9]+}}], 0x3 |
Tom Stellard | ba57308 | 2016-08-31 18:46:07 +0000 | [diff] [blame] | 41 | ; ALL: v_mov_b32_e32 [[V_VAL:v[0-9]+]], [[VAL]] |
| 42 | ; MESA: buffer_store_dword [[V_VAL]] |
| 43 | ; HSA: flat_store_dword v[{{[0-9]+:[0-9]+}}], [[V_VAL]] |
Matt Arsenault | 3dbeefa | 2017-03-21 21:39:51 +0000 | [diff] [blame] | 44 | define amdgpu_kernel void @test_implicit_alignment(i32 addrspace(1)* %out, <2 x i8> %in) #1 { |
Yaxun Liu | 0124b54 | 2018-02-13 18:00:25 +0000 | [diff] [blame] | 45 | %implicitarg.ptr = call noalias i8 addrspace(4)* @llvm.amdgcn.implicitarg.ptr() |
| 46 | %arg.ptr = bitcast i8 addrspace(4)* %implicitarg.ptr to i32 addrspace(4)* |
| 47 | %val = load i32, i32 addrspace(4)* %arg.ptr |
Tom Stellard | ba57308 | 2016-08-31 18:46:07 +0000 | [diff] [blame] | 48 | store i32 %val, i32 addrspace(1)* %out |
| 49 | ret void |
| 50 | } |
| 51 | |
Matt Arsenault | 23e4df6 | 2017-07-14 00:11:13 +0000 | [diff] [blame] | 52 | ; ALL-LABEL: {{^}}test_no_kernargs: |
| 53 | ; HSA: enable_sgpr_kernarg_segment_ptr = 1 |
| 54 | ; HSA: s_load_dword s{{[0-9]+}}, s[4:5] |
| 55 | define amdgpu_kernel void @test_no_kernargs() #1 { |
Yaxun Liu | 0124b54 | 2018-02-13 18:00:25 +0000 | [diff] [blame] | 56 | %kernarg.segment.ptr = call noalias i8 addrspace(4)* @llvm.amdgcn.kernarg.segment.ptr() |
| 57 | %header.ptr = bitcast i8 addrspace(4)* %kernarg.segment.ptr to i32 addrspace(4)* |
| 58 | %gep = getelementptr i32, i32 addrspace(4)* %header.ptr, i64 10 |
| 59 | %value = load i32, i32 addrspace(4)* %gep |
Matt Arsenault | 23e4df6 | 2017-07-14 00:11:13 +0000 | [diff] [blame] | 60 | store volatile i32 %value, i32 addrspace(1)* undef |
| 61 | ret void |
| 62 | } |
| 63 | |
Yaxun Liu | 0124b54 | 2018-02-13 18:00:25 +0000 | [diff] [blame] | 64 | declare i8 addrspace(4)* @llvm.amdgcn.kernarg.segment.ptr() #0 |
| 65 | declare i8 addrspace(4)* @llvm.amdgcn.implicitarg.ptr() #0 |
Matt Arsenault | dc4ebad | 2016-04-29 21:16:52 +0000 | [diff] [blame] | 66 | |
| 67 | attributes #0 = { nounwind readnone } |
| 68 | attributes #1 = { nounwind } |