| Sam Parker | 8c4b964 | 2018-08-10 13:57:13 +0000 | [diff] [blame] | 1 | ; RUN: llc -mtriple=thumbv8.main -mcpu=cortex-m33 %s -arm-disable-cgp=false -o - | FileCheck %s --check-prefix=CHECK-COMMON --check-prefix=CHECK-NODSP |
| 2 | ; RUN: llc -mtriple=thumbv7-linux-android %s -arm-disable-cgp=false -o - | FileCheck %s --check-prefix=CHECK-COMMON --check-prefix=CHECK-NODSP |
| 3 | ; RUN: llc -mtriple=thumbv7em %s -arm-disable-cgp=false -arm-enable-scalar-dsp=true -o - | FileCheck %s --check-prefix=CHECK-COMMON --check-prefix=CHECK-DSP |
| 4 | ; RUN: llc -mtriple=thumbv8 %s -arm-disable-cgp=false -arm-enable-scalar-dsp=true -arm-enable-scalar-dsp-imms=true -o - | FileCheck %s --check-prefix=CHECK-COMMON --check-prefix=CHECK-DSP-IMM |
| 5 | |
| 6 | ; Transform will fail because the trunc is not a sink. |
| 7 | ; CHECK-COMMON-LABEL: dsp_trunc |
| 8 | ; CHECK-COMMON: add [[ADD:[^ ]+]], |
| 9 | ; CHECK-DSP-NEXT: ldrh r1, [r3] |
| 10 | ; CHECK-DSP-NEXT: ldrh r2, [r2] |
| 11 | ; CHECK-DSP-NEXT: subs r1, r1, [[ADD]] |
| 12 | ; CHECK-DSP-NEXT: add r0, r2 |
| 13 | ; CHECK-DSP-NEXT: uxth r3, r1 |
| 14 | ; CHECK-DSP-NEXT: uxth r2, r0 |
| 15 | ; CHECK-DSP-NEXT: cmp r2, r3 |
| 16 | |
| 17 | ; With DSP-IMM, we could have: |
| 18 | ; movs r1, #0 |
| 19 | ; uxth r0, r0 |
| 20 | ; usub16 r1, r1, r0 |
| 21 | ; ldrh r0, [r2] |
| 22 | ; ldrh r3, [r3] |
| 23 | ; usub16 r0, r0, r1 |
| 24 | ; uadd16 r1, r3, r1 |
| 25 | ; cmp r0, r1 |
| 26 | define i16 @dsp_trunc(i32 %arg0, i32 %arg1, i16* %gep0, i16* %gep1) { |
| 27 | entry: |
| 28 | %add0 = add i32 %arg0, %arg1 |
| 29 | %conv0 = trunc i32 %add0 to i16 |
| 30 | %sub0 = sub i16 0, %conv0 |
| 31 | %load0 = load i16, i16* %gep0, align 2 |
| 32 | %load1 = load i16, i16* %gep1, align 2 |
| 33 | %sub1 = sub i16 %load0, %sub0 |
| 34 | %add1 = add i16 %load1, %sub0 |
| 35 | %cmp = icmp ult i16 %sub1, %add1 |
| 36 | %res = select i1 %cmp, i16 %add1, i16 %sub1 |
| 37 | ret i16 %res |
| 38 | } |
| 39 | |
| 40 | ; CHECK-COMMON-LABEL: trunc_i16_i8 |
| 41 | ; CHECK-COMMON: ldrh |
| 42 | ; CHECK-COMMON: uxtb |
| 43 | ; CHECK-COMMON: cmp |
| 44 | define i8 @trunc_i16_i8(i16* %ptr, i16 zeroext %arg0, i8 zeroext %arg1) { |
| 45 | entry: |
| 46 | %0 = load i16, i16* %ptr |
| 47 | %1 = add i16 %0, %arg0 |
| 48 | %2 = trunc i16 %1 to i8 |
| 49 | %3 = icmp ugt i8 %2, %arg1 |
| 50 | %4 = select i1 %3, i8 %2, i8 %arg1 |
| 51 | ret i8 %4 |
| 52 | } |
| 53 | |
| Sam Parker | 0e2f0bd | 2018-08-16 11:54:09 +0000 | [diff] [blame] | 54 | ; The pass perform the transform, but a uxtb will still be inserted to handle |
| 55 | ; the zext to the icmp. |
| Sam Parker | 8c4b964 | 2018-08-10 13:57:13 +0000 | [diff] [blame] | 56 | ; CHECK-COMMON-LABEL: icmp_i32_zext: |
| Sam Parker | 0e2f0bd | 2018-08-16 11:54:09 +0000 | [diff] [blame] | 57 | ; CHECK-COMMON: sub |
| Sam Parker | 8c4b964 | 2018-08-10 13:57:13 +0000 | [diff] [blame] | 58 | ; CHECK-COMMON: uxtb |
| Sam Parker | 0e2f0bd | 2018-08-16 11:54:09 +0000 | [diff] [blame] | 59 | ; CHECK-COMMON: cmp |
| Sam Parker | 8c4b964 | 2018-08-10 13:57:13 +0000 | [diff] [blame] | 60 | define i8 @icmp_i32_zext(i8* %ptr) { |
| 61 | entry: |
| 62 | %gep = getelementptr inbounds i8, i8* %ptr, i32 0 |
| 63 | %0 = load i8, i8* %gep, align 1 |
| 64 | %1 = sub nuw nsw i8 %0, 1 |
| 65 | %conv44 = zext i8 %0 to i32 |
| 66 | br label %preheader |
| 67 | |
| 68 | preheader: |
| 69 | br label %body |
| 70 | |
| 71 | body: |
| 72 | %2 = phi i8 [ %1, %preheader ], [ %3, %if.end ] |
| 73 | %si.0274 = phi i32 [ %conv44, %preheader ], [ %inc, %if.end ] |
| 74 | %conv51266 = zext i8 %2 to i32 |
| 75 | %cmp52267 = icmp eq i32 %si.0274, %conv51266 |
| 76 | br i1 %cmp52267, label %if.end, label %exit |
| 77 | |
| 78 | if.end: |
| 79 | %inc = add i32 %si.0274, 1 |
| 80 | %gep1 = getelementptr inbounds i8, i8* %ptr, i32 %inc |
| 81 | %3 = load i8, i8* %gep1, align 1 |
| 82 | br label %body |
| 83 | |
| 84 | exit: |
| 85 | ret i8 %2 |
| 86 | } |
| 87 | |
| Sam Parker | 481cdab | 2018-09-17 13:57:39 +0000 | [diff] [blame^] | 88 | ; TODO: We should be able to remove both extends from this example, by looking |
| 89 | ; back through the zexts and accepting a type size <= than the icmp. |
| 90 | ; CHECK-COMMON-LABEL: icmp_i16_zext |
| 91 | ; CHECK-COMMON: uxt |
| 92 | ; CHECK-COMMON: uxt |
| 93 | define i8 @icmp_i16_zext(i8* %ptr) { |
| 94 | entry: |
| 95 | %gep = getelementptr inbounds i8, i8* %ptr, i32 0 |
| 96 | %0 = load i8, i8* %gep, align 1 |
| 97 | %1 = sub nuw nsw i8 %0, 1 |
| 98 | %conv44 = zext i8 %0 to i16 |
| 99 | br label %preheader |
| 100 | |
| 101 | preheader: |
| 102 | br label %body |
| 103 | |
| 104 | body: |
| 105 | %2 = phi i8 [ %1, %preheader ], [ %3, %if.end ] |
| 106 | %si.0274 = phi i16 [ %conv44, %preheader ], [ %inc, %if.end ] |
| 107 | %conv51266 = zext i8 %2 to i16 |
| 108 | %cmp52267 = icmp eq i16 %si.0274, %conv51266 |
| 109 | br i1 %cmp52267, label %if.end, label %exit |
| 110 | |
| 111 | if.end: |
| 112 | %inc = add nuw i16 %si.0274, 1 |
| 113 | %conv = zext i16 %inc to i32 |
| 114 | %gep1 = getelementptr inbounds i8, i8* %ptr, i32 %conv |
| 115 | %3 = load i8, i8* %gep1, align 1 |
| 116 | br label %body |
| 117 | |
| 118 | exit: |
| 119 | ret i8 %2 |
| 120 | } |
| 121 | |
| Sam Parker | 0e2f0bd | 2018-08-16 11:54:09 +0000 | [diff] [blame] | 122 | ; Won't don't handle sext |
| Sam Parker | 8c4b964 | 2018-08-10 13:57:13 +0000 | [diff] [blame] | 123 | ; CHECK-COMMON-LABEL: icmp_sext_zext_store_i8_i16 |
| Sam Parker | 0e2f0bd | 2018-08-16 11:54:09 +0000 | [diff] [blame] | 124 | ; CHECK-COMMON: ldrb |
| 125 | ; CHECK-COMMON: ldrsh |
| Sam Parker | 8c4b964 | 2018-08-10 13:57:13 +0000 | [diff] [blame] | 126 | define i32 @icmp_sext_zext_store_i8_i16() { |
| 127 | entry: |
| 128 | %0 = load i8, i8* getelementptr inbounds ([16 x i8], [16 x i8]* @d_uch, i32 0, i32 2), align 1 |
| 129 | %conv = zext i8 %0 to i16 |
| 130 | store i16 %conv, i16* @sh1, align 2 |
| 131 | %conv1 = zext i8 %0 to i32 |
| 132 | %1 = load i16, i16* getelementptr inbounds ([16 x i16], [16 x i16]* @d_sh, i32 0, i32 2), align 2 |
| 133 | %conv2 = sext i16 %1 to i32 |
| 134 | %cmp = icmp eq i32 %conv1, %conv2 |
| 135 | %conv3 = zext i1 %cmp to i32 |
| 136 | ret i32 %conv3 |
| 137 | } |
| 138 | |
| Sam Parker | 8c4b964 | 2018-08-10 13:57:13 +0000 | [diff] [blame] | 139 | ; CHECK-COMMON-LABEL: or_icmp_ugt: |
| Sam Parker | 0e2f0bd | 2018-08-16 11:54:09 +0000 | [diff] [blame] | 140 | ; CHECK-COMMON: ldrb |
| 141 | ; CHECK-COMMON: sub.w |
| 142 | ; CHECK-COMMON-NOT: uxt |
| 143 | ; CHECK-COMMON: cmp.w |
| 144 | ; CHECK-COMMON-NOT: uxt |
| 145 | ; CHECK-COMMON: cmp |
| Sam Parker | 8c4b964 | 2018-08-10 13:57:13 +0000 | [diff] [blame] | 146 | define i1 @or_icmp_ugt(i32 %arg, i8* %ptr) { |
| 147 | entry: |
| 148 | %0 = load i8, i8* %ptr |
| 149 | %1 = zext i8 %0 to i32 |
| 150 | %mul = shl nuw nsw i32 %1, 1 |
| 151 | %add0 = add nuw nsw i32 %mul, 6 |
| 152 | %cmp0 = icmp ne i32 %arg, %add0 |
| 153 | %add1 = add i8 %0, -1 |
| 154 | %cmp1 = icmp ugt i8 %add1, 3 |
| 155 | %or = or i1 %cmp0, %cmp1 |
| 156 | ret i1 %or |
| 157 | } |
| 158 | |
| 159 | ; CHECK-COMMON-LABEL: icmp_switch_trunc: |
| 160 | ; CHECK-COMMON-NOT: uxt |
| 161 | define i16 @icmp_switch_trunc(i16 zeroext %arg) { |
| 162 | entry: |
| 163 | %conv = add nuw i16 %arg, 15 |
| 164 | %mul = mul nuw nsw i16 %conv, 3 |
| 165 | %trunc = trunc i16 %arg to i3 |
| 166 | switch i3 %trunc, label %default [ |
| 167 | i3 0, label %sw.bb |
| 168 | i3 1, label %sw.bb.i |
| 169 | ] |
| 170 | |
| 171 | sw.bb: |
| 172 | %cmp0 = icmp ult i16 %mul, 127 |
| 173 | %select = select i1 %cmp0, i16 %mul, i16 127 |
| 174 | br label %exit |
| 175 | |
| 176 | sw.bb.i: |
| 177 | %cmp1 = icmp ugt i16 %mul, 34 |
| 178 | %select.i = select i1 %cmp1, i16 %mul, i16 34 |
| 179 | br label %exit |
| 180 | |
| 181 | default: |
| 182 | br label %exit |
| 183 | |
| 184 | exit: |
| 185 | %res = phi i16 [ %select, %sw.bb ], [ %select.i, %sw.bb.i ], [ %mul, %default ] |
| 186 | ret i16 %res |
| 187 | } |
| 188 | |
| Sam Parker | 0e2f0bd | 2018-08-16 11:54:09 +0000 | [diff] [blame] | 189 | ; We currently only handle truncs as sinks, so a uxt will still be needed for |
| 190 | ; the icmp ugt instruction. |
| Sam Parker | 8c4b964 | 2018-08-10 13:57:13 +0000 | [diff] [blame] | 191 | ; CHECK-COMMON-LABEL: urem_trunc_icmps |
| Sam Parker | 0e2f0bd | 2018-08-16 11:54:09 +0000 | [diff] [blame] | 192 | ; CHECK-COMMON: cmp |
| Sam Parker | 8c4b964 | 2018-08-10 13:57:13 +0000 | [diff] [blame] | 193 | ; CHECK-COMMON: uxt |
| Sam Parker | 0e2f0bd | 2018-08-16 11:54:09 +0000 | [diff] [blame] | 194 | ; CHECK-COMMON: cmp |
| Sam Parker | 8c4b964 | 2018-08-10 13:57:13 +0000 | [diff] [blame] | 195 | define void @urem_trunc_icmps(i16** %in, i32* %g, i32* %k) { |
| 196 | entry: |
| 197 | %ptr = load i16*, i16** %in, align 4 |
| 198 | %ld = load i16, i16* %ptr, align 2 |
| 199 | %cmp.i = icmp eq i16 %ld, 0 |
| 200 | br i1 %cmp.i, label %exit, label %cond.false.i |
| 201 | |
| 202 | cond.false.i: |
| 203 | %rem = urem i16 5, %ld |
| 204 | %extract.t = trunc i16 %rem to i8 |
| 205 | br label %body |
| 206 | |
| 207 | body: |
| 208 | %cond.in.i.off0 = phi i8 [ %extract.t, %cond.false.i ], [ %add, %for.inc ] |
| 209 | %cmp = icmp ugt i8 %cond.in.i.off0, 7 |
| 210 | %conv5 = zext i1 %cmp to i32 |
| 211 | store i32 %conv5, i32* %g, align 4 |
| 212 | %.pr = load i32, i32* %k, align 4 |
| 213 | %tobool13150 = icmp eq i32 %.pr, 0 |
| 214 | br i1 %tobool13150, label %for.inc, label %exit |
| 215 | |
| 216 | for.inc: |
| 217 | %add = add nuw i8 %cond.in.i.off0, 1 |
| 218 | br label %body |
| 219 | |
| 220 | exit: |
| 221 | ret void |
| 222 | } |
| 223 | |
| 224 | ; CHECK-COMMON-LABEL: phi_feeding_switch |
| 225 | ; CHECK-COMMON: ldrb |
| 226 | ; CHECK-COMMON: uxtb |
| Sam Parker | 8c4b964 | 2018-08-10 13:57:13 +0000 | [diff] [blame] | 227 | define void @phi_feeding_switch(i8* %memblock, i8* %store, i16 %arg) { |
| 228 | entry: |
| 229 | %pre = load i8, i8* %memblock, align 1 |
| 230 | %conv = trunc i16 %arg to i8 |
| 231 | br label %header |
| 232 | |
| 233 | header: |
| 234 | %phi.0 = phi i8 [ %pre, %entry ], [ %count, %latch ] |
| 235 | %phi.1 = phi i8 [ %conv, %entry ], [ %phi.3, %latch ] |
| 236 | %phi.2 = phi i8 [ 0, %entry], [ %count, %latch ] |
| 237 | switch i8 %phi.0, label %default [ |
| 238 | i8 43, label %for.inc.i |
| 239 | i8 45, label %for.inc.i.i |
| 240 | ] |
| 241 | |
| 242 | for.inc.i: |
| 243 | %xor = xor i8 %phi.1, 1 |
| 244 | br label %latch |
| 245 | |
| 246 | for.inc.i.i: |
| 247 | %and = and i8 %phi.1, 3 |
| 248 | br label %latch |
| 249 | |
| 250 | default: |
| 251 | %sub = sub i8 %phi.0, 1 |
| 252 | %cmp2 = icmp ugt i8 %sub, 4 |
| 253 | br i1 %cmp2, label %latch, label %exit |
| 254 | |
| 255 | latch: |
| 256 | %phi.3 = phi i8 [ %xor, %for.inc.i ], [ %and, %for.inc.i.i ], [ %phi.2, %default ] |
| 257 | %count = add nuw i8 %phi.2, 1 |
| 258 | store i8 %count, i8* %store, align 1 |
| 259 | br label %header |
| 260 | |
| 261 | exit: |
| 262 | ret void |
| 263 | } |
| 264 | |
| Sam Parker | 8c4b964 | 2018-08-10 13:57:13 +0000 | [diff] [blame] | 265 | ; Check that %exp requires uxth in all cases, and will also be required to |
| 266 | ; promote %1 for the call - unless we can generate a uadd16. |
| 267 | ; CHECK-COMMON-LABEL: zext_load_sink_call: |
| 268 | ; CHECK-COMMON: uxt |
| 269 | ; uadd16 |
| 270 | ; cmp |
| 271 | ; CHECK-COMMON: uxt |
| 272 | define i32 @zext_load_sink_call(i16* %ptr, i16 %exp) { |
| 273 | entry: |
| 274 | %0 = load i16, i16* %ptr, align 4 |
| 275 | %1 = add i16 %exp, 3 |
| 276 | %cmp = icmp eq i16 %0, %exp |
| 277 | br i1 %cmp, label %exit, label %if.then |
| 278 | |
| 279 | if.then: |
| 280 | %conv0 = zext i16 %0 to i32 |
| 281 | %conv1 = zext i16 %1 to i32 |
| 282 | %call = tail call arm_aapcs_vfpcc i32 @dummy(i32 %conv0, i32 %conv1) |
| 283 | br label %exit |
| 284 | |
| 285 | exit: |
| 286 | %exitval = phi i32 [ %call, %if.then ], [ 0, %entry ] |
| 287 | ret i32 %exitval |
| 288 | } |
| 289 | |
| 290 | %class.ae = type { i8 } |
| 291 | %class.x = type { i8 } |
| 292 | %class.v = type { %class.q } |
| 293 | %class.q = type { i16 } |
| 294 | |
| 295 | ; CHECK-COMMON-LABEL: trunc_i16_i9_switch |
| 296 | ; CHECK-COMMON-NOT: uxt |
| 297 | define i32 @trunc_i16_i9_switch(%class.ae* %this) { |
| 298 | entry: |
| 299 | %call = tail call %class.x* @_ZNK2ae2afEv(%class.ae* %this) |
| 300 | %call2 = tail call %class.v* @_ZN1x2acEv(%class.x* %call) |
| 301 | %0 = getelementptr inbounds %class.v, %class.v* %call2, i32 0, i32 0, i32 0 |
| 302 | %1 = load i16, i16* %0, align 2 |
| 303 | %2 = trunc i16 %1 to i9 |
| 304 | %trunc = and i9 %2, -64 |
| 305 | switch i9 %trunc, label %cleanup.fold.split [ |
| 306 | i9 0, label %cleanup |
| 307 | i9 -256, label %if.then7 |
| 308 | ] |
| 309 | |
| 310 | if.then7: |
| 311 | %3 = and i16 %1, 7 |
| 312 | %tobool = icmp eq i16 %3, 0 |
| 313 | %cond = select i1 %tobool, i32 2, i32 1 |
| 314 | br label %cleanup |
| 315 | |
| 316 | cleanup.fold.split: |
| 317 | br label %cleanup |
| 318 | |
| 319 | cleanup: |
| 320 | %retval.0 = phi i32 [ %cond, %if.then7 ], [ 0, %entry ], [ 2, %cleanup.fold.split ] |
| 321 | ret i32 %retval.0 |
| 322 | } |
| 323 | |
| Sam Parker | 569b245 | 2018-09-12 09:11:48 +0000 | [diff] [blame] | 324 | ; CHECK-COMMON-LABEL: bitcast_i16 |
| 325 | ; CHECK-COMMON-NOT: uxt |
| 326 | define i16 @bitcast_i16(i16 zeroext %arg0, i16 zeroext %arg1) { |
| 327 | entry: |
| 328 | %cast = bitcast i16 12345 to i16 |
| 329 | %add = add nuw i16 %arg0, 1 |
| 330 | %cmp = icmp ule i16 %add, %cast |
| 331 | %res = select i1 %cmp, i16 %arg1, i16 32657 |
| 332 | ret i16 %res |
| 333 | } |
| 334 | |
| 335 | ; CHECK-COMMON-LABEL: bitcast_i8 |
| 336 | ; CHECK-COMMON-NOT: uxt |
| 337 | define i8 @bitcast_i8(i8 zeroext %arg0, i8 zeroext %arg1) { |
| 338 | entry: |
| 339 | %cast = bitcast i8 127 to i8 |
| 340 | %mul = shl nuw i8 %arg0, 1 |
| 341 | %cmp = icmp uge i8 %mul, %arg1 |
| 342 | %res = select i1 %cmp, i8 %cast, i8 128 |
| 343 | ret i8 %res |
| 344 | } |
| 345 | |
| 346 | ; CHECK-COMMON-LABEL: bitcast_i16_minus |
| 347 | ; CHECK-COMMON-NOT: uxt |
| 348 | define i16 @bitcast_i16_minus(i16 zeroext %arg0, i16 zeroext %arg1) { |
| 349 | entry: |
| 350 | %cast = bitcast i16 -12345 to i16 |
| 351 | %xor = xor i16 %arg0, 7 |
| 352 | %cmp = icmp eq i16 %xor, %arg1 |
| 353 | %res = select i1 %cmp, i16 %cast, i16 32657 |
| 354 | ret i16 %res |
| 355 | } |
| 356 | |
| 357 | ; CHECK-COMMON-LABEL: bitcast_i8_minus |
| 358 | ; CHECK-COMMON-NOT: uxt |
| 359 | define i8 @bitcast_i8_minus(i8 zeroext %arg0, i8 zeroext %arg1) { |
| 360 | entry: |
| 361 | %cast = bitcast i8 -127 to i8 |
| 362 | %and = and i8 %arg0, 3 |
| 363 | %cmp = icmp ne i8 %and, %arg1 |
| 364 | %res = select i1 %cmp, i8 %cast, i8 128 |
| 365 | ret i8 %res |
| 366 | } |
| 367 | |
| Sam Parker | 8c4b964 | 2018-08-10 13:57:13 +0000 | [diff] [blame] | 368 | declare %class.x* @_ZNK2ae2afEv(%class.ae*) local_unnamed_addr |
| 369 | declare %class.v* @_ZN1x2acEv(%class.x*) local_unnamed_addr |
| 370 | declare i32 @dummy(i32, i32) |
| 371 | |
| 372 | @d_uch = hidden local_unnamed_addr global [16 x i8] zeroinitializer, align 1 |
| 373 | @sh1 = hidden local_unnamed_addr global i16 0, align 2 |
| 374 | @d_sh = hidden local_unnamed_addr global [16 x i16] zeroinitializer, align 2 |