blob: 72941b3a46691810cd72bce847ccf93e8dab0dd9 [file] [log] [blame]
; RUN: llc -march=r600 -mcpu=SI -verify-machineinstrs < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s

; Tests in this file exercise absolute value on doubles, through the
; llvm.fabs intrinsic (scalar and vector forms) and through a direct call
; to a function named fabs.

; Absolute-value entry points used by the tests.
declare double @llvm.fabs.f64(double) readnone
declare <2 x double> @llvm.fabs.v2f64(<2 x double>) readnone
declare <4 x double> @llvm.fabs.v4f64(<4 x double>) readnone
declare double @fabs(double) readnone

; Supplies the per-invocation index used to address the input buffer.
declare i32 @llvm.r600.read.tidig.x() nounwind readnone
9
; Loads a double from %in at the index returned by llvm.r600.read.tidig.x,
; takes its absolute value, and stores the result to %out. The checks expect
; a V_AND_B32 to be emitted before the end of the program.
; FUNC-LABEL: {{^}}v_fabs_f64:
; SI: V_AND_B32
; SI: S_ENDPGM
define void @v_fabs_f64(double addrspace(1)* %out, double addrspace(1)* %in) {
  %idx = call i32 @llvm.r600.read.tidig.x() nounwind readnone
  %idx.wide = sext i32 %idx to i64
  %src = getelementptr double addrspace(1)* %in, i64 %idx.wide
  %x = load double addrspace(1)* %src, align 8
  %abs = call double @llvm.fabs.f64(double %x)
  store double %abs, double addrspace(1)* %out
  ret void
}
22
; Absolute value of a double passed directly as a kernel argument. After the
; first V_AND_B32 no second one may appear before the program ends
; (presumably only the half holding the sign bit needs masking).
; FUNC-LABEL: {{^}}fabs_f64:
; SI: V_AND_B32
; SI-NOT: V_AND_B32
; SI: S_ENDPGM
define void @fabs_f64(double addrspace(1)* %out, double %in) {
  %abs = call double @llvm.fabs.f64(double %in)
  store double %abs, double addrspace(1)* %out
  ret void
}
32
; Two-element vector form of the intrinsic. The checks expect two V_AND_B32
; instructions, one after the other, ahead of the program end.
; FUNC-LABEL: {{^}}fabs_v2f64:
; SI: V_AND_B32
; SI: V_AND_B32
; SI: S_ENDPGM
define void @fabs_v2f64(<2 x double> addrspace(1)* %out, <2 x double> %in) {
  %abs.vec = call <2 x double> @llvm.fabs.v2f64(<2 x double> %in)
  store <2 x double> %abs.vec, <2 x double> addrspace(1)* %out
  ret void
}
42
; Four-element vector form of the intrinsic. The checks expect four
; V_AND_B32 instructions in sequence ahead of the program end.
; FUNC-LABEL: {{^}}fabs_v4f64:
; SI: V_AND_B32
; SI: V_AND_B32
; SI: V_AND_B32
; SI: V_AND_B32
; SI: S_ENDPGM
define void @fabs_v4f64(<4 x double> addrspace(1)* %out, <4 x double> %in) {
  %abs.vec = call <4 x double> @llvm.fabs.v4f64(<4 x double> %in)
  store <4 x double> %abs.vec, <4 x double> addrspace(1)* %out
  ret void
}
54
; The absolute value feeds a multiply, so it is expected to fold into the
; V_MUL_F64 as a |...| modifier on the loaded scalar register pair. Nothing
; containing "AND" may be emitted between the argument load and the multiply.
; The label below uses the same shared prefix as the other tests in this file.
; FUNC-LABEL: {{^}}fabs_fold_f64:
; SI: S_LOAD_DWORDX2 [[ABS_VALUE:s\[[0-9]+:[0-9]+\]]], {{s\[[0-9]+:[0-9]+\]}}, 0xb
; SI-NOT: AND
; SI: V_MUL_F64 {{v\[[0-9]+:[0-9]+\]}}, |[[ABS_VALUE]]|, {{v\[[0-9]+:[0-9]+\]}}
; SI: S_ENDPGM
define void @fabs_fold_f64(double addrspace(1)* %out, double %in0, double %in1) {
  %abs = call double @llvm.fabs.f64(double %in0)
  %product = fmul double %abs, %in1
  store double %product, double addrspace(1)* %out
  ret void
}
66
; Same folding expectation as the intrinsic-based variant, but the absolute
; value comes from a direct call to the function named fabs. The result must
; still appear as a |...| modifier on the V_MUL_F64 source, with nothing
; containing "AND" emitted between the argument load and the multiply.
; The label below uses the same shared prefix as the other tests in this file.
; FUNC-LABEL: {{^}}fabs_fn_fold_f64:
; SI: S_LOAD_DWORDX2 [[ABS_VALUE:s\[[0-9]+:[0-9]+\]]], {{s\[[0-9]+:[0-9]+\]}}, 0xb
; SI-NOT: AND
; SI: V_MUL_F64 {{v\[[0-9]+:[0-9]+\]}}, |[[ABS_VALUE]]|, {{v\[[0-9]+:[0-9]+\]}}
; SI: S_ENDPGM
define void @fabs_fn_fold_f64(double addrspace(1)* %out, double %in0, double %in1) {
  %abs = call double @fabs(double %in0)
  %product = fmul double %abs, %in1
  store double %product, double addrspace(1)* %out
  ret void
}
78
; The operand starts life as an i64 kernel argument and is reinterpreted as
; a double before the intrinsic is applied. The checks expect a V_AND_B32
; ahead of the program end.
; FUNC-LABEL: {{^}}fabs_free_f64:
; SI: V_AND_B32
; SI: S_ENDPGM
define void @fabs_free_f64(double addrspace(1)* %out, i64 %in) {
  %as.f64 = bitcast i64 %in to double
  %abs = call double @llvm.fabs.f64(double %as.f64)
  store double %abs, double addrspace(1)* %out
  ret void
}
88
; Like the intrinsic-based bitcast test, except the absolute value is taken
; by calling the function named fabs on the reinterpreted i64 argument. The
; checks expect a V_AND_B32 ahead of the program end.
; FUNC-LABEL: {{^}}fabs_fn_free_f64:
; SI: V_AND_B32
; SI: S_ENDPGM
define void @fabs_fn_free_f64(double addrspace(1)* %out, i64 %in) {
  %as.f64 = bitcast i64 %in to double
  %abs = call double @fabs(double %as.f64)
  store double %abs, double addrspace(1)* %out
  ret void
}