Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 1 | ; RUN: llc < %s -march=r600 -mcpu=redwood | FileCheck %s |
| 2 | |
| 3 | ; These tests check that floating point comparisons which are used by select |
| 4 | ; to store integer true (-1) and false (0) values are lowered to one of the |
| 5 | ; SET*DX10 instructions. |
| 6 | |
Tom Stellard | 79243d9 | 2014-10-01 17:15:17 +0000 | [diff] [blame] | 7 | ; CHECK: {{^}}fcmp_une_select_fptosi: |
Matthias Braun | 97d0ffb | 2015-12-04 01:51:19 +0000 | [diff] [blame] | 8 | ; CHECK: LSHR |
| 9 | ; CHECK-NEXT: SETNE_DX10 * {{\** *}}T{{[0-9]+\.[XYZW]}}, KC0[2].Z, literal.y, |
Vincent Lejeune | f97af79 | 2013-05-02 21:52:30 +0000 | [diff] [blame] | 10 | ; CHECK-NEXT: 1084227584(5.000000e+00) |
Matt Arsenault | 3dbeefa | 2017-03-21 21:39:51 +0000 | [diff] [blame] | 11 | define amdgpu_kernel void @fcmp_une_select_fptosi(i32 addrspace(1)* %out, float %in) { |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 12 | entry: |
| 13 | %0 = fcmp une float %in, 5.0 |
| 14 | %1 = select i1 %0, float 1.000000e+00, float 0.000000e+00 |
| 15 | %2 = fsub float -0.000000e+00, %1 |
| 16 | %3 = fptosi float %2 to i32 |
| 17 | store i32 %3, i32 addrspace(1)* %out |
| 18 | ret void |
| 19 | } |
| 20 | |
Tom Stellard | 79243d9 | 2014-10-01 17:15:17 +0000 | [diff] [blame] | 21 | ; CHECK: {{^}}fcmp_une_select_i32: |
Matthias Braun | 97d0ffb | 2015-12-04 01:51:19 +0000 | [diff] [blame] | 22 | ; CHECK: LSHR |
| 23 | ; CHECK-NEXT: SETNE_DX10 * {{\** *}}T{{[0-9]+\.[XYZW]}}, KC0[2].Z, literal.y, |
Vincent Lejeune | f97af79 | 2013-05-02 21:52:30 +0000 | [diff] [blame] | 24 | ; CHECK-NEXT: 1084227584(5.000000e+00) |
Matt Arsenault | 3dbeefa | 2017-03-21 21:39:51 +0000 | [diff] [blame] | 25 | define amdgpu_kernel void @fcmp_une_select_i32(i32 addrspace(1)* %out, float %in) { |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 26 | entry: |
| 27 | %0 = fcmp une float %in, 5.0 |
| 28 | %1 = select i1 %0, i32 -1, i32 0 |
| 29 | store i32 %1, i32 addrspace(1)* %out |
| 30 | ret void |
| 31 | } |
| 32 | |
Tom Stellard | 79243d9 | 2014-10-01 17:15:17 +0000 | [diff] [blame] | 33 | ; CHECK: {{^}}fcmp_oeq_select_fptosi: |
Matthias Braun | 97d0ffb | 2015-12-04 01:51:19 +0000 | [diff] [blame] | 34 | ; CHECK: LSHR |
| 35 | ; CHECK-NEXT: SETE_DX10 * {{\** *}}T{{[0-9]+\.[XYZW]}}, KC0[2].Z, literal.y, |
Vincent Lejeune | f97af79 | 2013-05-02 21:52:30 +0000 | [diff] [blame] | 36 | ; CHECK-NEXT: 1084227584(5.000000e+00) |
Matt Arsenault | 3dbeefa | 2017-03-21 21:39:51 +0000 | [diff] [blame] | 37 | define amdgpu_kernel void @fcmp_oeq_select_fptosi(i32 addrspace(1)* %out, float %in) { |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 38 | entry: |
Tom Stellard | 0351ea2 | 2013-09-28 02:50:50 +0000 | [diff] [blame] | 39 | %0 = fcmp oeq float %in, 5.0 |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 40 | %1 = select i1 %0, float 1.000000e+00, float 0.000000e+00 |
| 41 | %2 = fsub float -0.000000e+00, %1 |
| 42 | %3 = fptosi float %2 to i32 |
| 43 | store i32 %3, i32 addrspace(1)* %out |
| 44 | ret void |
| 45 | } |
| 46 | |
Tom Stellard | 79243d9 | 2014-10-01 17:15:17 +0000 | [diff] [blame] | 47 | ; CHECK: {{^}}fcmp_oeq_select_i32: |
Matthias Braun | 97d0ffb | 2015-12-04 01:51:19 +0000 | [diff] [blame] | 48 | ; CHECK: LSHR |
| 49 | ; CHECK-NEXT: SETE_DX10 * {{\** *}}T{{[0-9]+\.[XYZW]}}, KC0[2].Z, literal.y, |
Vincent Lejeune | f97af79 | 2013-05-02 21:52:30 +0000 | [diff] [blame] | 50 | ; CHECK-NEXT: 1084227584(5.000000e+00) |
Matt Arsenault | 3dbeefa | 2017-03-21 21:39:51 +0000 | [diff] [blame] | 51 | define amdgpu_kernel void @fcmp_oeq_select_i32(i32 addrspace(1)* %out, float %in) { |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 52 | entry: |
Tom Stellard | 0351ea2 | 2013-09-28 02:50:50 +0000 | [diff] [blame] | 53 | %0 = fcmp oeq float %in, 5.0 |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 54 | %1 = select i1 %0, i32 -1, i32 0 |
| 55 | store i32 %1, i32 addrspace(1)* %out |
| 56 | ret void |
| 57 | } |
| 58 | |
Tom Stellard | 79243d9 | 2014-10-01 17:15:17 +0000 | [diff] [blame] | 59 | ; CHECK: {{^}}fcmp_ogt_select_fptosi: |
Matthias Braun | 97d0ffb | 2015-12-04 01:51:19 +0000 | [diff] [blame] | 60 | ; CHECK: LSHR |
| 61 | ; CHECK-NEXT: SETGT_DX10 * {{\** *}}T{{[0-9]+\.[XYZW]}}, KC0[2].Z, literal.y, |
Vincent Lejeune | f97af79 | 2013-05-02 21:52:30 +0000 | [diff] [blame] | 62 | ; CHECK-NEXT: 1084227584(5.000000e+00) |
Matt Arsenault | 3dbeefa | 2017-03-21 21:39:51 +0000 | [diff] [blame] | 63 | define amdgpu_kernel void @fcmp_ogt_select_fptosi(i32 addrspace(1)* %out, float %in) { |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 64 | entry: |
Tom Stellard | 0351ea2 | 2013-09-28 02:50:50 +0000 | [diff] [blame] | 65 | %0 = fcmp ogt float %in, 5.0 |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 66 | %1 = select i1 %0, float 1.000000e+00, float 0.000000e+00 |
| 67 | %2 = fsub float -0.000000e+00, %1 |
| 68 | %3 = fptosi float %2 to i32 |
| 69 | store i32 %3, i32 addrspace(1)* %out |
| 70 | ret void |
| 71 | } |
| 72 | |
Tom Stellard | 79243d9 | 2014-10-01 17:15:17 +0000 | [diff] [blame] | 73 | ; CHECK: {{^}}fcmp_ogt_select_i32: |
Matthias Braun | 97d0ffb | 2015-12-04 01:51:19 +0000 | [diff] [blame] | 74 | ; CHECK: LSHR |
| 75 | ; CHECK-NEXT: SETGT_DX10 * {{\** *}}T{{[0-9]+\.[XYZW]}}, KC0[2].Z, literal.y, |
Vincent Lejeune | f97af79 | 2013-05-02 21:52:30 +0000 | [diff] [blame] | 76 | ; CHECK-NEXT: 1084227584(5.000000e+00) |
Matt Arsenault | 3dbeefa | 2017-03-21 21:39:51 +0000 | [diff] [blame] | 77 | define amdgpu_kernel void @fcmp_ogt_select_i32(i32 addrspace(1)* %out, float %in) { |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 78 | entry: |
Tom Stellard | 0351ea2 | 2013-09-28 02:50:50 +0000 | [diff] [blame] | 79 | %0 = fcmp ogt float %in, 5.0 |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 80 | %1 = select i1 %0, i32 -1, i32 0 |
| 81 | store i32 %1, i32 addrspace(1)* %out |
| 82 | ret void |
| 83 | } |
| 84 | |
Tom Stellard | 79243d9 | 2014-10-01 17:15:17 +0000 | [diff] [blame] | 85 | ; CHECK: {{^}}fcmp_oge_select_fptosi: |
Matthias Braun | 97d0ffb | 2015-12-04 01:51:19 +0000 | [diff] [blame] | 86 | ; CHECK: LSHR |
| 87 | ; CHECK-NEXT: SETGE_DX10 * {{\** *}}T{{[0-9]+\.[XYZW]}}, KC0[2].Z, literal.y, |
Vincent Lejeune | f97af79 | 2013-05-02 21:52:30 +0000 | [diff] [blame] | 88 | ; CHECK-NEXT: 1084227584(5.000000e+00) |
Matt Arsenault | 3dbeefa | 2017-03-21 21:39:51 +0000 | [diff] [blame] | 89 | define amdgpu_kernel void @fcmp_oge_select_fptosi(i32 addrspace(1)* %out, float %in) { |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 90 | entry: |
Tom Stellard | 0351ea2 | 2013-09-28 02:50:50 +0000 | [diff] [blame] | 91 | %0 = fcmp oge float %in, 5.0 |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 92 | %1 = select i1 %0, float 1.000000e+00, float 0.000000e+00 |
| 93 | %2 = fsub float -0.000000e+00, %1 |
| 94 | %3 = fptosi float %2 to i32 |
| 95 | store i32 %3, i32 addrspace(1)* %out |
| 96 | ret void |
| 97 | } |
| 98 | |
Tom Stellard | 79243d9 | 2014-10-01 17:15:17 +0000 | [diff] [blame] | 99 | ; CHECK: {{^}}fcmp_oge_select_i32: |
Matthias Braun | 97d0ffb | 2015-12-04 01:51:19 +0000 | [diff] [blame] | 100 | ; CHECK: LSHR |
| 101 | ; CHECK-NEXT: SETGE_DX10 * {{\** *}}T{{[0-9]+\.[XYZW]}}, KC0[2].Z, literal.y, |
Vincent Lejeune | f97af79 | 2013-05-02 21:52:30 +0000 | [diff] [blame] | 102 | ; CHECK-NEXT: 1084227584(5.000000e+00) |
Matt Arsenault | 3dbeefa | 2017-03-21 21:39:51 +0000 | [diff] [blame] | 103 | define amdgpu_kernel void @fcmp_oge_select_i32(i32 addrspace(1)* %out, float %in) { |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 104 | entry: |
Tom Stellard | 0351ea2 | 2013-09-28 02:50:50 +0000 | [diff] [blame] | 105 | %0 = fcmp oge float %in, 5.0 |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 106 | %1 = select i1 %0, i32 -1, i32 0 |
| 107 | store i32 %1, i32 addrspace(1)* %out |
| 108 | ret void |
| 109 | } |
| 110 | |
Tom Stellard | 79243d9 | 2014-10-01 17:15:17 +0000 | [diff] [blame] | 111 | ; CHECK: {{^}}fcmp_ole_select_fptosi: |
Matthias Braun | 97d0ffb | 2015-12-04 01:51:19 +0000 | [diff] [blame] | 112 | ; CHECK: LSHR |
| 113 | ; CHECK-NEXT: SETGE_DX10 * {{\** *}}T{{[0-9]+\.[XYZW]}}, literal.y, KC0[2].Z, |
Vincent Lejeune | f97af79 | 2013-05-02 21:52:30 +0000 | [diff] [blame] | 114 | ; CHECK-NEXT: 1084227584(5.000000e+00) |
Matt Arsenault | 3dbeefa | 2017-03-21 21:39:51 +0000 | [diff] [blame] | 115 | define amdgpu_kernel void @fcmp_ole_select_fptosi(i32 addrspace(1)* %out, float %in) { |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 116 | entry: |
Tom Stellard | 0351ea2 | 2013-09-28 02:50:50 +0000 | [diff] [blame] | 117 | %0 = fcmp ole float %in, 5.0 |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 118 | %1 = select i1 %0, float 1.000000e+00, float 0.000000e+00 |
| 119 | %2 = fsub float -0.000000e+00, %1 |
| 120 | %3 = fptosi float %2 to i32 |
| 121 | store i32 %3, i32 addrspace(1)* %out |
| 122 | ret void |
| 123 | } |
| 124 | |
Tom Stellard | 79243d9 | 2014-10-01 17:15:17 +0000 | [diff] [blame] | 125 | ; CHECK: {{^}}fcmp_ole_select_i32: |
Matthias Braun | 97d0ffb | 2015-12-04 01:51:19 +0000 | [diff] [blame] | 126 | ; CHECK: LSHR |
| 127 | ; CHECK-NEXT: SETGE_DX10 * {{\** *}}T{{[0-9]+\.[XYZW]}}, literal.y, KC0[2].Z, |
Vincent Lejeune | f97af79 | 2013-05-02 21:52:30 +0000 | [diff] [blame] | 128 | ; CHECK-NEXT: 1084227584(5.000000e+00) |
Matt Arsenault | 3dbeefa | 2017-03-21 21:39:51 +0000 | [diff] [blame] | 129 | define amdgpu_kernel void @fcmp_ole_select_i32(i32 addrspace(1)* %out, float %in) { |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 130 | entry: |
Tom Stellard | 0351ea2 | 2013-09-28 02:50:50 +0000 | [diff] [blame] | 131 | %0 = fcmp ole float %in, 5.0 |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 132 | %1 = select i1 %0, i32 -1, i32 0 |
| 133 | store i32 %1, i32 addrspace(1)* %out |
| 134 | ret void |
| 135 | } |
| 136 | |
Tom Stellard | 79243d9 | 2014-10-01 17:15:17 +0000 | [diff] [blame] | 137 | ; CHECK: {{^}}fcmp_olt_select_fptosi: |
Matthias Braun | 97d0ffb | 2015-12-04 01:51:19 +0000 | [diff] [blame] | 138 | ; CHECK: LSHR |
| 139 | ; CHECK-NEXT: SETGT_DX10 * {{\** *}}T{{[0-9]+\.[XYZW]}}, literal.y, KC0[2].Z, |
Vincent Lejeune | f97af79 | 2013-05-02 21:52:30 +0000 | [diff] [blame] | 140 | ; CHECK-NEXT: 1084227584(5.000000e+00) |
Matt Arsenault | 3dbeefa | 2017-03-21 21:39:51 +0000 | [diff] [blame] | 141 | define amdgpu_kernel void @fcmp_olt_select_fptosi(i32 addrspace(1)* %out, float %in) { |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 142 | entry: |
Tom Stellard | 0351ea2 | 2013-09-28 02:50:50 +0000 | [diff] [blame] | 143 | %0 = fcmp olt float %in, 5.0 |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 144 | %1 = select i1 %0, float 1.000000e+00, float 0.000000e+00 |
| 145 | %2 = fsub float -0.000000e+00, %1 |
| 146 | %3 = fptosi float %2 to i32 |
| 147 | store i32 %3, i32 addrspace(1)* %out |
| 148 | ret void |
| 149 | } |
| 150 | |
Tom Stellard | 79243d9 | 2014-10-01 17:15:17 +0000 | [diff] [blame] | 151 | ; CHECK: {{^}}fcmp_olt_select_i32: |
Matthias Braun | 97d0ffb | 2015-12-04 01:51:19 +0000 | [diff] [blame] | 152 | ; CHECK: LSHR |
| 153 | ; CHECK-NEXT: SETGT_DX10 * {{\** *}}T{{[0-9]+\.[XYZW]}}, literal.y, KC0[2].Z, |
Vincent Lejeune | f97af79 | 2013-05-02 21:52:30 +0000 | [diff] [blame] | 154 | ; CHECK-NEXT: 1084227584(5.000000e+00) |
Matt Arsenault | 3dbeefa | 2017-03-21 21:39:51 +0000 | [diff] [blame] | 155 | define amdgpu_kernel void @fcmp_olt_select_i32(i32 addrspace(1)* %out, float %in) { |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 156 | entry: |
Tom Stellard | 0351ea2 | 2013-09-28 02:50:50 +0000 | [diff] [blame] | 157 | %0 = fcmp olt float %in, 5.0 |
Tom Stellard | e06163a | 2013-02-07 14:02:35 +0000 | [diff] [blame] | 158 | %1 = select i1 %0, i32 -1, i32 0 |
| 159 | store i32 %1, i32 addrspace(1)* %out |
| 160 | ret void |
| 161 | } |