blob: d37d432842f37d1b94fa73a78bb13bde38546ceb [file] [log] [blame]
Alexander Timofeev982aee62017-07-04 17:32:00 +00001; RUN: llc -amdgpu-scalarize-global-loads=false -march=amdgcn -mcpu=tahiti -verify-machineinstrs < %s | FileCheck -check-prefix=FUNC -check-prefix=SI %s
2; RUN: llc -amdgpu-scalarize-global-loads=false -march=amdgcn -mcpu=tonga -verify-machineinstrs < %s | FileCheck -check-prefix=FUNC -check-prefix=SI %s
Tom Stellard7512c082013-07-12 18:14:56 +00003
Tom Stellard79243d92014-10-01 17:15:17 +00004; FUNC-LABEL: {{^}}fmul_f64:
Tom Stellard326d6ec2014-11-05 14:50:53 +00005; SI: v_mul_f64 {{v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\]}}
Matt Arsenault3dbeefa2017-03-21 21:39:51 +00006define amdgpu_kernel void @fmul_f64(double addrspace(1)* %out, double addrspace(1)* %in1,
Tom Stellard7512c082013-07-12 18:14:56 +00007 double addrspace(1)* %in2) {
David Blaikiea79ac142015-02-27 21:17:42 +00008 %r0 = load double, double addrspace(1)* %in1
9 %r1 = load double, double addrspace(1)* %in2
Tom Stellard7512c082013-07-12 18:14:56 +000010 %r2 = fmul double %r0, %r1
11 store double %r2, double addrspace(1)* %out
12 ret void
13}
Matt Arsenault0fd0a312014-09-15 17:04:54 +000014
Tom Stellard79243d92014-10-01 17:15:17 +000015; FUNC-LABEL: {{^}}fmul_v2f64:
Tom Stellard326d6ec2014-11-05 14:50:53 +000016; SI: v_mul_f64 {{v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\]}}
17; SI: v_mul_f64 {{v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\]}}
Matt Arsenault3dbeefa2017-03-21 21:39:51 +000018define amdgpu_kernel void @fmul_v2f64(<2 x double> addrspace(1)* %out, <2 x double> addrspace(1)* %in1,
Matt Arsenault0fd0a312014-09-15 17:04:54 +000019 <2 x double> addrspace(1)* %in2) {
David Blaikiea79ac142015-02-27 21:17:42 +000020 %r0 = load <2 x double>, <2 x double> addrspace(1)* %in1
21 %r1 = load <2 x double>, <2 x double> addrspace(1)* %in2
Matt Arsenault0fd0a312014-09-15 17:04:54 +000022 %r2 = fmul <2 x double> %r0, %r1
23 store <2 x double> %r2, <2 x double> addrspace(1)* %out
24 ret void
25}
26
Tom Stellard79243d92014-10-01 17:15:17 +000027; FUNC-LABEL: {{^}}fmul_v4f64:
Tom Stellard326d6ec2014-11-05 14:50:53 +000028; SI: v_mul_f64 {{v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\]}}
29; SI: v_mul_f64 {{v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\]}}
30; SI: v_mul_f64 {{v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\]}}
31; SI: v_mul_f64 {{v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\]}}
Matt Arsenault3dbeefa2017-03-21 21:39:51 +000032define amdgpu_kernel void @fmul_v4f64(<4 x double> addrspace(1)* %out, <4 x double> addrspace(1)* %in1,
Matt Arsenault0fd0a312014-09-15 17:04:54 +000033 <4 x double> addrspace(1)* %in2) {
David Blaikiea79ac142015-02-27 21:17:42 +000034 %r0 = load <4 x double>, <4 x double> addrspace(1)* %in1
35 %r1 = load <4 x double>, <4 x double> addrspace(1)* %in2
Matt Arsenault0fd0a312014-09-15 17:04:54 +000036 %r2 = fmul <4 x double> %r0, %r1
37 store <4 x double> %r2, <4 x double> addrspace(1)* %out
38 ret void
39}