Matt Arsenault | 4bf43d4 | 2015-09-25 17:27:08 +0000 | [diff] [blame] | 1 | ; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck -check-prefix=GCN %s |
| 2 | |
| 3 | ; The replacement of i64 stores with v2i32 stores resulted in |
| 4 | ; breaking other users of the bitcast if they already existed. |
| 5 | |
| 6 | ; GCN-LABEL: {{^}}extract_vector_elt_select_error: |
| 7 | ; GCN: buffer_store_dword |
| 8 | ; GCN: buffer_store_dword |
| 9 | ; GCN: buffer_store_dwordx2 |
; Bitcasts the i64 argument %val to <2 x i32>, extracts both 32-bit elements,
; and stores each of them to %out; the original i64 %val is then stored to %in.
; The bitcast therefore has extractelement users while %val is also stored
; directly as an i64.
; All three stores are volatile; the two i32 stores both target %out.
; NOTE(review): presumably volatile is used so that none of the stores is
; removed or merged, matching the two buffer_store_dword and one
; buffer_store_dwordx2 checks that precede this function - confirm.
| 10 | define void @extract_vector_elt_select_error(i32 addrspace(1)* %out, i64 addrspace(1)* %in, i64 %val) nounwind { |
| 11 | %vec = bitcast i64 %val to <2 x i32> |
| 12 | %elt0 = extractelement <2 x i32> %vec, i32 0 |
| 13 | %elt1 = extractelement <2 x i32> %vec, i32 1 |
| 14 | |
| 15 | store volatile i32 %elt0, i32 addrspace(1)* %out |
| 16 | store volatile i32 %elt1, i32 addrspace(1)* %out |
| 17 | store volatile i64 %val, i64 addrspace(1)* %in |
| 18 | ret void |
| 19 | } |
Matt Arsenault | 61001bb | 2015-11-25 19:58:34 +0000 | [diff] [blame] | 20 | |
| 21 | |
; Extracts both elements of the <2 x i64> argument %foo using constant indices
; and stores them swapped: element 1 goes to %out, element 0 goes to the next
; i64 slot (%out + 1). Both stores are volatile.
; NOTE(review): no FileCheck directives are attached to this function in the
; visible source, so it appears to be covered only by the RUN line itself
; (llc with -verify-machineinstrs). Without a GCN-LABEL here, the GCN checks of
; the preceding function are not bounded by a following label - consider
; adding one.
| 22 | define void @extract_vector_elt_v2i64(i64 addrspace(1)* %out, <2 x i64> %foo) nounwind { |
| 23 | %p0 = extractelement <2 x i64> %foo, i32 0 |
| 24 | %p1 = extractelement <2 x i64> %foo, i32 1 |
| 25 | %out1 = getelementptr i64, i64 addrspace(1)* %out, i32 1 |
| 26 | store volatile i64 %p1, i64 addrspace(1)* %out |
| 27 | store volatile i64 %p0, i64 addrspace(1)* %out1 |
| 28 | ret void |
| 29 | } |
| 30 | |
; Extracts one element of the <2 x i64> argument %foo, selected by the
; non-constant index argument %elt, and stores it (volatile) to %out.
; NOTE(review): no FileCheck directives are attached to this function in the
; visible source; it appears to be covered only by the RUN line itself.
| 31 | define void @dyn_extract_vector_elt_v2i64(i64 addrspace(1)* %out, <2 x i64> %foo, i32 %elt) nounwind { |
| 32 | %dynelt = extractelement <2 x i64> %foo, i32 %elt |
| 33 | store volatile i64 %dynelt, i64 addrspace(1)* %out |
| 34 | ret void |
| 35 | } |
| 36 | |
; Variant of the dynamic-index extract where the vector is computed rather
; than passed in directly: a <2 x i64> is volatile-loaded from %foo, OR'ed
; with the argument %arst, and the element selected by the non-constant index
; %elt is stored (volatile) to %out.
; NOTE(review): no FileCheck directives are attached to this function in the
; visible source; it appears to be covered only by the RUN line itself.
| 37 | define void @dyn_extract_vector_elt_v2i64_2(i64 addrspace(1)* %out, <2 x i64> addrspace(1)* %foo, i32 %elt, <2 x i64> %arst) nounwind { |
| 38 | %load = load volatile <2 x i64>, <2 x i64> addrspace(1)* %foo |
| 39 | %or = or <2 x i64> %load, %arst |
| 40 | %dynelt = extractelement <2 x i64> %or, i32 %elt |
| 41 | store volatile i64 %dynelt, i64 addrspace(1)* %out |
| 42 | ret void |
| 43 | } |