; RUN: llc -march=amdgcn -mcpu=SI < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s
; RUN: llc -march=amdgcn -mcpu=tonga < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s
; RUN: llc -march=r600 -mcpu=redwood < %s

; Scalar 32-bit signed remainder with both operands loaded from memory:
; the numerator is read from %in[0], the denominator from %in[1], and the
; result is written to %out. No output patterns are attached to this
; function in the visible file, so it only has to compile.
define void @srem_i32(i32 addrspace(1)* %out, i32 addrspace(1)* %in) {
  %den_ptr = getelementptr i32, i32 addrspace(1)* %in, i32 1
  %num = load i32, i32 addrspace(1)* %in
  %den = load i32, i32 addrspace(1)* %den_ptr
  %result = srem i32 %num, %den
  store i32 %result, i32 addrspace(1)* %out
  ret void
}

; Scalar 32-bit signed remainder by the constant 4 (a power of two).
; The numerator is loaded from %in and the result is stored to %out.
define void @srem_i32_4(i32 addrspace(1)* %out, i32 addrspace(1)* %in) {
  %num = load i32, i32 addrspace(1)* %in
  %result = srem i32 %num, 4
  store i32 %result, i32 addrspace(1)* %out
  ret void
}

; Scalar 32-bit signed remainder by the constant 7 (not a power of two).
; The patterns below expect a multiply-high by a constant held in a VGPR,
; followed by a low multiply and a subtract, i.e. a multiply-based expansion
; rather than a general division sequence. 0x92492493 is presumably the
; signed 32-bit magic multiplier for division by 7.
; FUNC-LABEL: {{^}}srem_i32_7:
; SI: v_mov_b32_e32 [[MAGIC:v[0-9]+]], 0x92492493
; SI: v_mul_hi_i32 {{v[0-9]+}}, [[MAGIC]],
; SI: v_mul_lo_i32
; SI: v_sub_i32
; SI: s_endpgm
define void @srem_i32_7(i32 addrspace(1)* %out, i32 addrspace(1)* %in) {
  %num = load i32, i32 addrspace(1)* %in
  %result = srem i32 %num, 7
  store i32 %result, i32 addrspace(1)* %out
  ret void
}

; Element-wise signed remainder on <2 x i32> with both operands loaded from
; memory: the numerator vector is %in[0], the denominator vector is %in[1]
; (indexing in units of <2 x i32>), and the result is stored to %out.
define void @srem_v2i32(<2 x i32> addrspace(1)* %out, <2 x i32> addrspace(1)* %in) {
  %den_ptr = getelementptr <2 x i32>, <2 x i32> addrspace(1)* %in, i32 1
  %num = load <2 x i32>, <2 x i32> addrspace(1)* %in
  %den = load <2 x i32>, <2 x i32> addrspace(1)* %den_ptr
  %result = srem <2 x i32> %num, %den
  store <2 x i32> %result, <2 x i32> addrspace(1)* %out
  ret void
}

; Element-wise signed remainder of a <2 x i32> loaded from %in by a constant
; vector whose lanes are all 4; the result is stored to %out.
define void @srem_v2i32_4(<2 x i32> addrspace(1)* %out, <2 x i32> addrspace(1)* %in) {
  %num = load <2 x i32>, <2 x i32> addrspace(1)* %in
  %result = srem <2 x i32> %num, <i32 4, i32 4>
  store <2 x i32> %result, <2 x i32> addrspace(1)* %out
  ret void
}

; Element-wise signed remainder on <4 x i32> with both operands loaded from
; memory: the numerator vector is %in[0], the denominator vector is %in[1]
; (indexing in units of <4 x i32>), and the result is stored to %out.
define void @srem_v4i32(<4 x i32> addrspace(1)* %out, <4 x i32> addrspace(1)* %in) {
  %den_ptr = getelementptr <4 x i32>, <4 x i32> addrspace(1)* %in, i32 1
  %num = load <4 x i32>, <4 x i32> addrspace(1)* %in
  %den = load <4 x i32>, <4 x i32> addrspace(1)* %den_ptr
  %result = srem <4 x i32> %num, %den
  store <4 x i32> %result, <4 x i32> addrspace(1)* %out
  ret void
}

; Element-wise signed remainder of a <4 x i32> loaded from %in by a constant
; vector whose lanes are all 4; the result is stored to %out.
define void @srem_v4i32_4(<4 x i32> addrspace(1)* %out, <4 x i32> addrspace(1)* %in) {
  %num = load <4 x i32>, <4 x i32> addrspace(1)* %in
  %result = srem <4 x i32> %num, <i32 4, i32 4, i32 4, i32 4>
  store <4 x i32> %result, <4 x i32> addrspace(1)* %out
  ret void
}

; Scalar 64-bit signed remainder with both operands loaded from memory:
; the numerator is read from %in[0], the denominator from %in[1], and the
; result is written to %out.
define void @srem_i64(i64 addrspace(1)* %out, i64 addrspace(1)* %in) {
  %den_ptr = getelementptr i64, i64 addrspace(1)* %in, i64 1
  %num = load i64, i64 addrspace(1)* %in
  %den = load i64, i64 addrspace(1)* %den_ptr
  %result = srem i64 %num, %den
  store i64 %result, i64 addrspace(1)* %out
  ret void
}

; Scalar 64-bit signed remainder by the constant 4 (a power of two).
; The numerator is loaded from %in and the result is stored to %out.
define void @srem_i64_4(i64 addrspace(1)* %out, i64 addrspace(1)* %in) {
  %num = load i64, i64 addrspace(1)* %in
  %result = srem i64 %num, 4
  store i64 %result, i64 addrspace(1)* %out
  ret void
}

; Element-wise signed remainder on <2 x i64> with both operands loaded from
; memory: the numerator vector is %in[0], the denominator vector is %in[1]
; (indexing in units of <2 x i64>), and the result is stored to %out.
define void @srem_v2i64(<2 x i64> addrspace(1)* %out, <2 x i64> addrspace(1)* %in) {
  %den_ptr = getelementptr <2 x i64>, <2 x i64> addrspace(1)* %in, i64 1
  %num = load <2 x i64>, <2 x i64> addrspace(1)* %in
  %den = load <2 x i64>, <2 x i64> addrspace(1)* %den_ptr
  %result = srem <2 x i64> %num, %den
  store <2 x i64> %result, <2 x i64> addrspace(1)* %out
  ret void
}

; Element-wise signed remainder of a <2 x i64> loaded from %in by a constant
; vector whose lanes are all 4; the result is stored to %out.
define void @srem_v2i64_4(<2 x i64> addrspace(1)* %out, <2 x i64> addrspace(1)* %in) {
  %num = load <2 x i64>, <2 x i64> addrspace(1)* %in
  %result = srem <2 x i64> %num, <i64 4, i64 4>
  store <2 x i64> %result, <2 x i64> addrspace(1)* %out
  ret void
}

; Element-wise signed remainder on <4 x i64> with both operands loaded from
; memory: the numerator vector is %in[0], the denominator vector is %in[1]
; (indexing in units of <4 x i64>), and the result is stored to %out.
define void @srem_v4i64(<4 x i64> addrspace(1)* %out, <4 x i64> addrspace(1)* %in) {
  %den_ptr = getelementptr <4 x i64>, <4 x i64> addrspace(1)* %in, i64 1
  %num = load <4 x i64>, <4 x i64> addrspace(1)* %in
  %den = load <4 x i64>, <4 x i64> addrspace(1)* %den_ptr
  %result = srem <4 x i64> %num, %den
  store <4 x i64> %result, <4 x i64> addrspace(1)* %out
  ret void
}

; Element-wise signed remainder of a <4 x i64> loaded from %in by a constant
; vector whose lanes are all 4; the result is stored to %out.
define void @srem_v4i64_4(<4 x i64> addrspace(1)* %out, <4 x i64> addrspace(1)* %in) {
  %num = load <4 x i64>, <4 x i64> addrspace(1)* %in
  %result = srem <4 x i64> %num, <i64 4, i64 4, i64 4, i64 4>
  store <4 x i64> %result, <4 x i64> addrspace(1)* %out
  ret void
}