; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=fiji -verify-machineinstrs < %s | FileCheck -check-prefix=GCN %s

; The GEP index is produced by a volatile load from addrspace(5), so the
; address of the dependent addrspace(4) load is not known to be uniform.
; The checks below require a buffer_load_dword followed by a flat_load_dword,
; with no scalar "s_load_dword s..." selected before or after the flat load.
; NOTE(review): the %flat argument is unused in this kernel; it is kept so the
; kernel signature (and therefore the argument loads) stays unchanged.
; GCN-LABEL: {{^}}private_load_maybe_divergent:
; GCN: buffer_load_dword
; GCN-NOT: s_load_dword s
; GCN: flat_load_dword
; GCN-NOT: s_load_dword s
define amdgpu_kernel void @private_load_maybe_divergent(i32 addrspace(4)* %k, i32* %flat) {
  %load = load volatile i32, i32 addrspace(5)* undef, align 4
  %gep = getelementptr inbounds i32, i32 addrspace(4)* %k, i32 %load
  %maybe.not.uniform.load = load i32, i32 addrspace(4)* %gep, align 4
  store i32 %maybe.not.uniform.load, i32 addrspace(1)* undef
  ret void
}

; The GEP index is loaded through the generic pointer %flat, so the address of
; the dependent addrspace(4) load is not known to be uniform.
; The checks below require one s_load_dwordx4 (presumably the kernel-argument
; load -- confirm against llc output), then two flat_load_dword instructions
; and a flat_store_dword, with no further s_load in between.
; GCN-LABEL: {{^}}flat_load_maybe_divergent:
; GCN: s_load_dwordx4
; GCN-NOT: s_load
; GCN: flat_load_dword
; GCN-NOT: s_load
; GCN: flat_load_dword
; GCN-NOT: s_load
; GCN: flat_store_dword
define amdgpu_kernel void @flat_load_maybe_divergent(i32 addrspace(4)* %k, i32* %flat) {
  %load = load i32, i32* %flat, align 4
  %gep = getelementptr inbounds i32, i32 addrspace(4)* %k, i32 %load
  %maybe.not.uniform.load = load i32, i32 addrspace(4)* %gep, align 4
  store i32 %maybe.not.uniform.load, i32 addrspace(1)* undef
  ret void
}