Peter Collingbourne | 913869b | 2012-05-28 21:48:37 +0000 | [diff] [blame] | 1 | ; RUN: llc < %s -march=nvptx -mcpu=sm_20 | FileCheck %s |
| 2 | ; RUN: llc < %s -march=nvptx64 -mcpu=sm_20 | FileCheck %s |
| 3 | |
; llvm.fabs.f32 applied to a float argument is expected to be selected as the
; PTX abs.f32 instruction.
; CHECK-LABEL: test_fabsf(
define float @test_fabsf(float %f) {
; CHECK: abs.f32
  %x = call float @llvm.fabs.f32(float %f)
  ret float %x
}
| 10 | |
; llvm.fabs.f64 applied to a double argument is expected to be selected as the
; PTX abs.f64 instruction.
; CHECK-LABEL: test_fabs(
; CHECK: abs.f64
define double @test_fabs(double %d) {
  %abs = call double @llvm.fabs.f64(double %d)
  ret double %abs
}
| 17 | |
; The NVVM-specific llvm.nvvm.sqrt.f intrinsic is expected to be emitted as
; sqrt.rn.f32.
; CHECK-LABEL: test_nvvm_sqrt(
; CHECK: sqrt.rn.f32
define float @test_nvvm_sqrt(float %a) {
  %root = call float @llvm.nvvm.sqrt.f(float %a)
  ret float %root
}
| 24 | |
; llvm.bitreverse.i32 is expected to be selected as the PTX brev.b32
; instruction.
; CHECK-LABEL: test_bitreverse32(
; CHECK: brev.b32
define i32 @test_bitreverse32(i32 %a) {
  %reversed = call i32 @llvm.bitreverse.i32(i32 %a)
  ret i32 %reversed
}
| 31 | |
; llvm.bitreverse.i64 is expected to be selected as the PTX brev.b64
; instruction.
; CHECK-LABEL: test_bitreverse64(
; CHECK: brev.b64
define i64 @test_bitreverse64(i64 %a) {
  %reversed = call i64 @llvm.bitreverse.i64(i64 %a)
  ret i64 %reversed
}
| 38 | |
; llvm.ctpop.i32 is expected to be selected as the PTX popc.b32 instruction.
; CHECK-LABEL: test_popc32(
; CHECK: popc.b32
define i32 @test_popc32(i32 %a) {
  %count = call i32 @llvm.ctpop.i32(i32 %a)
  ret i32 %count
}
| 45 | |
; llvm.ctpop.i64 returning an i64 is expected to emit popc.b64 followed by a
; cvt.u64.u32 that widens the result to the i64 return type.
; The trailing '(' keeps the label pattern from also matching
; test_popc64_trunc.
; CHECK-LABEL: test_popc64(
define i64 @test_popc64(i64 %a) {
; CHECK: popc.b64
; CHECK: cvt.u64.u32
  %val = call i64 @llvm.ctpop.i64(i64 %a)
  ret i64 %val
}
| 53 | |
; NVPTX popc.b64 returns an i32 even though @llvm.ctpop.i64 returns an i64, so
; if this function returns an i32, there's no need to do any type conversions
; in the PTX.
; CHECK-LABEL: test_popc64_trunc(
define i32 @test_popc64_trunc(i64 %a) {
; CHECK: popc.b64
; CHECK-NOT: cvt.
  %val = call i64 @llvm.ctpop.i64(i64 %a)
  %trunc = trunc i64 %val to i32
  ret i32 %trunc
}
| 65 | |
; llvm.ctpop.i16 is implemented by converting to i32, running popc.b32, and
; then converting back to i16.
; The trailing '(' keeps the label pattern from also matching
; test_popc16_to_32.
; CHECK-LABEL: test_popc16(
define void @test_popc16(i16 %a, i16* %b) {
; CHECK: cvt.u32.u16
; CHECK: popc.b32
; CHECK: cvt.u16.u32
  %val = call i16 @llvm.ctpop.i16(i16 %a)
  ; The result is stored through %b rather than returned.
  store i16 %val, i16* %b
  ret void
}
| 77 | |
; If we call llvm.ctpop.i16 and then zext the result to i32, we shouldn't need
; to do any conversions after calling popc.b32, because that returns an i32.
; CHECK-LABEL: test_popc16_to_32(
define i32 @test_popc16_to_32(i16 %a) {
; CHECK: cvt.u32.u16
; CHECK: popc.b32
; CHECK-NOT: cvt.
  %val = call i16 @llvm.ctpop.i16(i16 %a)
  %zext = zext i16 %val to i32
  ret i32 %zext
}
| 89 | |
; Declarations of the intrinsics called by the tests in this file.

; Floating point.
declare float @llvm.fabs.f32(float)
declare double @llvm.fabs.f64(double)
declare float @llvm.nvvm.sqrt.f(float)

; Bit reversal.
declare i32 @llvm.bitreverse.i32(i32)
declare i64 @llvm.bitreverse.i64(i64)

; Population count.
declare i16 @llvm.ctpop.i16(i16)
declare i32 @llvm.ctpop.i32(i32)
declare i64 @llvm.ctpop.i64(i64)