| Changpeng Fang | b41574a | 2015-12-22 20:55:23 +0000 | [diff] [blame] | 1 | ; RUN: llc -march=amdgcn -mcpu=kaveri -mtriple=amdgcn-unknown-amdhsa -mattr=-flat-for-global < %s | FileCheck -check-prefix=GCN %s |
| Matt Arsenault | 68d9386 | 2015-09-24 08:36:14 +0000 | [diff] [blame] | 2 | |
| 3 | ; Check that when mubuf addr64 instruction is handled in moveToVALU |
| 4 | ; from the pointer, dead register writes are not emitted. |
| 5 | |
| 6 | ; FIXME: We should be able to use the SGPR directly as src0 to v_add_i32 |
| 7 | |
| 8 | ; GCN-LABEL: {{^}}clobber_vgpr_pair_pointer_add: |
| Matt Arsenault | 7f9eabd | 2016-05-21 03:55:07 +0000 | [diff] [blame] | 9 | ; GCN-DAG: s_load_dwordx2 s{{\[}}[[ARG1LO:[0-9]+]]:[[ARG1HI:[0-9]+]]{{\]}}, s{{\[[0-9]+:[0-9]+\]}}, 0x0{{$}} |
| Tom Stellard | cb6ba62 | 2016-04-30 00:23:06 +0000 | [diff] [blame] | 10 | ; GCN-DAG: buffer_load_dwordx2 v{{\[}}[[LDPTRLO:[0-9]+]]:[[LDPTRHI:[0-9]+]]{{\]}} |
| Matt Arsenault | 68d9386 | 2015-09-24 08:36:14 +0000 | [diff] [blame] | 11 | |
| 12 | ; GCN-NOT: v_mov_b32 |
| Matthias Braun | 6ad3d05 | 2016-06-25 00:23:00 +0000 | [diff] [blame] | 13 | ; GCN: v_mov_b32_e32 v[[VARG1LO:[0-9]+]], s[[ARG1LO]] |
| 14 | ; GCN-NOT: v_mov_b32 |
| Tom Stellard | 0d23ebe | 2016-08-29 19:42:52 +0000 | [diff] [blame] | 15 | ; GCN: v_mov_b32_e32 v[[VARG1HI:[0-9]+]], s[[ARG1HI]] |
| 16 | ; GCN-NOT: v_mov_b32 |
| Matt Arsenault | 68d9386 | 2015-09-24 08:36:14 +0000 | [diff] [blame] | 17 | |
| 18 | ; GCN: v_add_i32_e32 v[[PTRLO:[0-9]+]], vcc, v[[LDPTRLO]], v[[VARG1LO]] |
| 19 | ; GCN: v_addc_u32_e32 v[[PTRHI:[0-9]+]], vcc, v[[LDPTRHI]], v[[VARG1HI]] |
| 20 | ; GCN: buffer_load_ubyte v{{[0-9]+}}, v{{\[}}[[PTRLO]]:[[PTRHI]]{{\]}}, |
| 21 | |
| Matt Arsenault | 3dbeefa | 2017-03-21 21:39:51 +0000 | [diff] [blame] | 22 | define amdgpu_kernel void @clobber_vgpr_pair_pointer_add(i64 %arg1, i8 addrspace(1)* addrspace(1)* %ptrarg, i32 %arg3) #0 { |
| Matt Arsenault | 68d9386 | 2015-09-24 08:36:14 +0000 | [diff] [blame] | 23 | bb: |
| 24 | %tmp = icmp sgt i32 %arg3, 0 |
| 25 | br i1 %tmp, label %bb4, label %bb17 |
| 26 | |
| 27 | bb4: |
| 28 | %tmp14 = load volatile i8 addrspace(1)*, i8 addrspace(1)* addrspace(1)* %ptrarg |
| 29 | %tmp15 = getelementptr inbounds i8, i8 addrspace(1)* %tmp14, i64 %arg1 |
| 30 | %tmp16 = load volatile i8, i8 addrspace(1)* %tmp15 |
| 31 | br label %bb17 |
| 32 | |
| 33 | bb17: |
| 34 | ret void |
| 35 | } |
| 36 | |
| 37 | attributes #0 = { nounwind } |