Tom Stellard | 49f8bfd | 2015-01-06 18:00:21 +0000 | [diff] [blame] | 1 | ; RUN: llc -march=amdgcn -mcpu=tahiti -verify-machineinstrs < %s | FileCheck -check-prefix=SI %s |
Marek Olsak | 7517077 | 2015-01-27 17:27:15 +0000 | [diff] [blame] | 2 | ; RUN: llc -march=amdgcn -mcpu=tonga -verify-machineinstrs < %s | FileCheck -check-prefix=SI %s |
Tom Stellard | 2a6a6105 | 2013-07-12 18:15:08 +0000 | [diff] [blame] | 3 | |
Matt Arsenault | 20711b7 | 2015-02-20 22:10:45 +0000 | [diff] [blame] | 4 | declare double @llvm.fabs.f64(double) #0 |
| 5 | |
Tom Stellard | 79243d9 | 2014-10-01 17:15:17 +0000 | [diff] [blame] | 6 | ; SI-LABEL: {{^}}fsub_f64: |
Tom Stellard | 326d6ec | 2014-11-05 14:50:53 +0000 | [diff] [blame] | 7 | ; SI: v_add_f64 {{v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\], -v\[[0-9]+:[0-9]+\]}} |
Tom Stellard | 2a6a6105 | 2013-07-12 18:15:08 +0000 | [diff] [blame] | 8 | define void @fsub_f64(double addrspace(1)* %out, double addrspace(1)* %in1, |
| 9 | double addrspace(1)* %in2) { |
David Blaikie | a79ac14 | 2015-02-27 21:17:42 +0000 | [diff] [blame] | 10 | %r0 = load double, double addrspace(1)* %in1 |
| 11 | %r1 = load double, double addrspace(1)* %in2 |
Matt Arsenault | 20711b7 | 2015-02-20 22:10:45 +0000 | [diff] [blame] | 12 | %r2 = fsub double %r0, %r1 |
| 13 | store double %r2, double addrspace(1)* %out |
| 14 | ret void |
Tom Stellard | 2a6a6105 | 2013-07-12 18:15:08 +0000 | [diff] [blame] | 15 | } |
Matt Arsenault | 20711b7 | 2015-02-20 22:10:45 +0000 | [diff] [blame] | 16 | |
| 17 | ; SI-LABEL: {{^}}fsub_fabs_f64: |
| 18 | ; SI: v_add_f64 {{v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\], -\|v\[[0-9]+:[0-9]+\]\|}} |
| 19 | define void @fsub_fabs_f64(double addrspace(1)* %out, double addrspace(1)* %in1, |
| 20 | double addrspace(1)* %in2) { |
David Blaikie | a79ac14 | 2015-02-27 21:17:42 +0000 | [diff] [blame] | 21 | %r0 = load double, double addrspace(1)* %in1 |
| 22 | %r1 = load double, double addrspace(1)* %in2 |
Matt Arsenault | 20711b7 | 2015-02-20 22:10:45 +0000 | [diff] [blame] | 23 | %r1.fabs = call double @llvm.fabs.f64(double %r1) #0 |
| 24 | %r2 = fsub double %r0, %r1.fabs |
| 25 | store double %r2, double addrspace(1)* %out |
| 26 | ret void |
| 27 | } |
| 28 | |
| 29 | ; SI-LABEL: {{^}}fsub_fabs_inv_f64: |
| 30 | ; SI: v_add_f64 {{v\[[0-9]+:[0-9]+\], |v\[[0-9]+:[0-9]+\]|, -v\[[0-9]+:[0-9]+\]}} |
| 31 | define void @fsub_fabs_inv_f64(double addrspace(1)* %out, double addrspace(1)* %in1, |
| 32 | double addrspace(1)* %in2) { |
David Blaikie | a79ac14 | 2015-02-27 21:17:42 +0000 | [diff] [blame] | 33 | %r0 = load double, double addrspace(1)* %in1 |
| 34 | %r1 = load double, double addrspace(1)* %in2 |
Matt Arsenault | 20711b7 | 2015-02-20 22:10:45 +0000 | [diff] [blame] | 35 | %r0.fabs = call double @llvm.fabs.f64(double %r0) #0 |
| 36 | %r2 = fsub double %r0.fabs, %r1 |
| 37 | store double %r2, double addrspace(1)* %out |
| 38 | ret void |
| 39 | } |
| 40 | |
| 41 | ; SI-LABEL: {{^}}s_fsub_f64: |
| 42 | ; SI: v_add_f64 {{v\[[0-9]+:[0-9]+\], s\[[0-9]+:[0-9]+\], -v\[[0-9]+:[0-9]+\]}} |
| 43 | define void @s_fsub_f64(double addrspace(1)* %out, double %a, double %b) { |
| 44 | %sub = fsub double %a, %b |
| 45 | store double %sub, double addrspace(1)* %out |
| 46 | ret void |
| 47 | } |
| 48 | |
| 49 | ; SI-LABEL: {{^}}s_fsub_imm_f64: |
Matt Arsenault | 3d1c1de | 2016-04-14 21:58:24 +0000 | [diff] [blame] | 50 | ; SI: v_add_f64 {{v\[[0-9]+:[0-9]+\], -s\[[0-9]+:[0-9]+\]}}, 4.0 |
Matt Arsenault | 20711b7 | 2015-02-20 22:10:45 +0000 | [diff] [blame] | 51 | define void @s_fsub_imm_f64(double addrspace(1)* %out, double %a, double %b) { |
| 52 | %sub = fsub double 4.0, %a |
| 53 | store double %sub, double addrspace(1)* %out |
| 54 | ret void |
| 55 | } |
| 56 | |
| 57 | ; SI-LABEL: {{^}}s_fsub_imm_inv_f64: |
Matt Arsenault | 3d1c1de | 2016-04-14 21:58:24 +0000 | [diff] [blame] | 58 | ; SI: v_add_f64 {{v\[[0-9]+:[0-9]+\], s\[[0-9]+:[0-9]+\]}}, -4.0 |
Matt Arsenault | 20711b7 | 2015-02-20 22:10:45 +0000 | [diff] [blame] | 59 | define void @s_fsub_imm_inv_f64(double addrspace(1)* %out, double %a, double %b) { |
| 60 | %sub = fsub double %a, 4.0 |
| 61 | store double %sub, double addrspace(1)* %out |
| 62 | ret void |
| 63 | } |
| 64 | |
| 65 | ; SI-LABEL: {{^}}s_fsub_self_f64: |
| 66 | ; SI: v_add_f64 {{v\[[0-9]+:[0-9]+\], s\[[0-9]+:[0-9]+\], -s\[[0-9]+:[0-9]+\]}} |
| 67 | define void @s_fsub_self_f64(double addrspace(1)* %out, double %a) { |
| 68 | %sub = fsub double %a, %a |
| 69 | store double %sub, double addrspace(1)* %out |
| 70 | ret void |
| 71 | } |
| 72 | |
| 73 | ; SI-LABEL: {{^}}fsub_v2f64: |
| 74 | ; SI: v_add_f64 {{v\[[0-9]+:[0-9]+\], s\[[0-9]+:[0-9]+\], -v\[[0-9]+:[0-9]+\]}} |
| 75 | ; SI: v_add_f64 {{v\[[0-9]+:[0-9]+\], s\[[0-9]+:[0-9]+\], -v\[[0-9]+:[0-9]+\]}} |
| 76 | define void @fsub_v2f64(<2 x double> addrspace(1)* %out, <2 x double> %a, <2 x double> %b) { |
| 77 | %sub = fsub <2 x double> %a, %b |
| 78 | store <2 x double> %sub, <2 x double> addrspace(1)* %out |
| 79 | ret void |
| 80 | } |
| 81 | |
| 82 | ; SI-LABEL: {{^}}fsub_v4f64: |
| 83 | ; SI: v_add_f64 {{v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\], -v\[[0-9]+:[0-9]+\]}} |
| 84 | ; SI: v_add_f64 {{v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\], -v\[[0-9]+:[0-9]+\]}} |
| 85 | ; SI: v_add_f64 {{v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\], -v\[[0-9]+:[0-9]+\]}} |
| 86 | ; SI: v_add_f64 {{v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\], -v\[[0-9]+:[0-9]+\]}} |
| 87 | define void @fsub_v4f64(<4 x double> addrspace(1)* %out, <4 x double> addrspace(1)* %in) { |
David Blaikie | 79e6c74 | 2015-02-27 19:29:02 +0000 | [diff] [blame] | 88 | %b_ptr = getelementptr <4 x double>, <4 x double> addrspace(1)* %in, i32 1 |
David Blaikie | a79ac14 | 2015-02-27 21:17:42 +0000 | [diff] [blame] | 89 | %a = load <4 x double>, <4 x double> addrspace(1)* %in |
| 90 | %b = load <4 x double>, <4 x double> addrspace(1)* %b_ptr |
Matt Arsenault | 20711b7 | 2015-02-20 22:10:45 +0000 | [diff] [blame] | 91 | %result = fsub <4 x double> %a, %b |
| 92 | store <4 x double> %result, <4 x double> addrspace(1)* %out |
| 93 | ret void |
| 94 | } |
| 95 | |
| 96 | ; SI-LABEL: {{^}}s_fsub_v4f64: |
| 97 | ; SI: v_add_f64 {{v\[[0-9]+:[0-9]+\], s\[[0-9]+:[0-9]+\], -v\[[0-9]+:[0-9]+\]}} |
| 98 | ; SI: v_add_f64 {{v\[[0-9]+:[0-9]+\], s\[[0-9]+:[0-9]+\], -v\[[0-9]+:[0-9]+\]}} |
| 99 | ; SI: v_add_f64 {{v\[[0-9]+:[0-9]+\], s\[[0-9]+:[0-9]+\], -v\[[0-9]+:[0-9]+\]}} |
| 100 | ; SI: v_add_f64 {{v\[[0-9]+:[0-9]+\], s\[[0-9]+:[0-9]+\], -v\[[0-9]+:[0-9]+\]}} |
| 101 | define void @s_fsub_v4f64(<4 x double> addrspace(1)* %out, <4 x double> %a, <4 x double> %b) { |
| 102 | %result = fsub <4 x double> %a, %b |
| 103 | store <4 x double> %result, <4 x double> addrspace(1)* %out, align 16 |
| 104 | ret void |
| 105 | } |
| 106 | |
| 107 | attributes #0 = { nounwind readnone } |