blob: 509b547a5c82a17679f47cc037d98e43a79b7a43 [file] [log] [blame]
Tim Northover3b0846e2014-05-24 12:50:23 +00001; RUN: llc -mtriple=aarch64-none-linux-gnu < %s | FileCheck %s --check-prefix=CHECK
Tim Northovere0e3aef2013-01-31 12:12:40 +00002
3; First, a simple example from Clang. The registers could plausibly be
4; different, but probably won't be.
5
; NOTE(review): presumably the Clang bitfield struct that from_clang was
; derived from; no function visible in this file refers to it by name.
6%struct.foo = type { i8, [2 x i8], i8 }
7
; Merges (%n << 3) & 0x78 into the low 32 bits of the coerced argument, whose
; other low-byte bits are kept with mask 0x87. The expected output is a single
; 32-bit bfi with lsb #3 and width #4.
8define [1 x i64] @from_clang([1 x i64] %f.coerce, i32 %n) nounwind readnone {
Stephen Lind24ab202013-07-14 06:24:09 +00009; CHECK-LABEL: from_clang:
Tim Northover534acbd2014-05-01 12:29:38 +000010; CHECK: bfi {{w[0-9]+}}, {{w[0-9]+}}, #3, #4
Tim Northovere0e3aef2013-01-31 12:12:40 +000011
12entry:
13 %f.coerce.fca.0.extract = extractvalue [1 x i64] %f.coerce, 0
14 %tmp.sroa.0.0.extract.trunc = trunc i64 %f.coerce.fca.0.extract to i32
15 %bf.value = shl i32 %n, 3
16 %0 = and i32 %bf.value, 120 ; = 0x78, the inserted field
17 %f.sroa.0.0.insert.ext.masked = and i32 %tmp.sroa.0.0.extract.trunc, 135 ; = 0x87, bits kept around the field
18 %1 = or i32 %f.sroa.0.0.insert.ext.masked, %0
19 %f.sroa.0.0.extract.trunc = zext i32 %1 to i64
20 %tmp1.sroa.1.1.insert.insert = and i64 %f.coerce.fca.0.extract, 4294967040 ; = 0xffffff00
21 %tmp1.sroa.0.0.insert.insert = or i64 %f.sroa.0.0.extract.trunc, %tmp1.sroa.1.1.insert.insert
22 %.fca.0.insert = insertvalue [1 x i64] undef, i64 %tmp1.sroa.0.0.insert.insert, 0
23 ret [1 x i64] %.fca.0.insert
24}
25
; 32-bit insert where the keep mask (0x83ffffff) and the insert mask
; (0x7c000000) are exact complements: five bits of *%new land at bit 26 of
; *%existing. The expected output is a bfi with lsb #26 and width #5.
26define void @test_whole32(i32* %existing, i32* %new) {
Stephen Linf799e3f2013-07-13 20:38:47 +000027; CHECK-LABEL: test_whole32:
Tim Northovereb6611e2014-04-24 12:11:53 +000028
Tim Northover534acbd2014-05-01 12:29:38 +000029; CHECK: bfi {{w[0-9]+}}, {{w[0-9]+}}, #26, #5
Tim Northovere0e3aef2013-01-31 12:12:40 +000030
David Blaikiea79ac142015-02-27 21:17:42 +000031 %oldval = load volatile i32, i32* %existing
Tim Northovere0e3aef2013-01-31 12:12:40 +000032 %oldval_keep = and i32 %oldval, 2214592511 ; =0x83ffffff
33
David Blaikiea79ac142015-02-27 21:17:42 +000034 %newval = load volatile i32, i32* %new
Tim Northovere0e3aef2013-01-31 12:12:40 +000035 %newval_shifted = shl i32 %newval, 26
36 %newval_masked = and i32 %newval_shifted, 2080374784 ; = 0x7c000000
37
38 %combined = or i32 %oldval_keep, %newval_masked
39 store volatile i32 %combined, i32* %existing
40
41 ret void
42}
43
; 64-bit counterpart of test_whole32: the insert mask 0xfffc000000 covers bits
; 26..39 (14 bits) and the keep mask is its complement. The expected output is
; a 64-bit bfi with lsb #26 and width #14, with no separate "and" before ret.
44define void @test_whole64(i64* %existing, i64* %new) {
Stephen Linf799e3f2013-07-13 20:38:47 +000045; CHECK-LABEL: test_whole64:
Tim Northover534acbd2014-05-01 12:29:38 +000046; CHECK: bfi {{x[0-9]+}}, {{x[0-9]+}}, #26, #14
Tim Northovere0e3aef2013-01-31 12:12:40 +000047; CHECK-NOT: and
48; CHECK: ret
49
David Blaikiea79ac142015-02-27 21:17:42 +000050 %oldval = load volatile i64, i64* %existing
Tim Northovere0e3aef2013-01-31 12:12:40 +000051 %oldval_keep = and i64 %oldval, 18446742974265032703 ; = 0xffffff0003ffffffL
52
David Blaikiea79ac142015-02-27 21:17:42 +000053 %newval = load volatile i64, i64* %new
Tim Northovere0e3aef2013-01-31 12:12:40 +000054 %newval_shifted = shl i64 %newval, 26
55 %newval_masked = and i64 %newval_shifted, 1099444518912 ; = 0xfffc000000
56
57 %combined = or i64 %oldval_keep, %newval_masked
58 store volatile i64 %combined, i64* %existing
59
60 ret void
61}
62
; 64-bit values whose masks only touch the low 32 bits: bits 16..31 of
; *%existing are kept (0xffff0000) and the low 16 bits come from *%new
; (0xffff, no shift). The expected output is a 64-bit bfxil with lsb #0 and
; width #16.
63define void @test_whole32_from64(i64* %existing, i64* %new) {
Stephen Linf799e3f2013-07-13 20:38:47 +000064; CHECK-LABEL: test_whole32_from64:
Tim Northovereb6611e2014-04-24 12:11:53 +000065
Tim Northover534acbd2014-05-01 12:29:38 +000066
Tim Northover3b0846e2014-05-24 12:50:23 +000067; CHECK: bfxil {{x[0-9]+}}, {{x[0-9]+}}, #0, #16
Tim Northovereb6611e2014-04-24 12:11:53 +000068
Tim Northovere0e3aef2013-01-31 12:12:40 +000069; CHECK: ret
70
David Blaikiea79ac142015-02-27 21:17:42 +000071 %oldval = load volatile i64, i64* %existing
Tim Northovere0e3aef2013-01-31 12:12:40 +000072 %oldval_keep = and i64 %oldval, 4294901760 ; = 0xffff0000
73
David Blaikiea79ac142015-02-27 21:17:42 +000074 %newval = load volatile i64, i64* %new
Tim Northovere0e3aef2013-01-31 12:12:40 +000075 %newval_masked = and i64 %newval, 65535 ; = 0xffff
76
77 %combined = or i64 %oldval_keep, %newval_masked
78 store volatile i64 %combined, i64* %existing
79
80 ret void
81}
82
; 32-bit insert where the keep mask (0x87) is not the full complement of the
; insert mask (0x78), so the old value still needs masking. The expected
; output is an "and" followed by a bfi with lsb #3 and width #4.
83define void @test_32bit_masked(i32 *%existing, i32 *%new) {
Stephen Linf799e3f2013-07-13 20:38:47 +000084; CHECK-LABEL: test_32bit_masked:
Tim Northovereb6611e2014-04-24 12:11:53 +000085
Tim Northover3b0846e2014-05-24 12:50:23 +000086; CHECK: and
Tim Northover534acbd2014-05-01 12:29:38 +000087; CHECK: bfi [[INSERT:w[0-9]+]], {{w[0-9]+}}, #3, #4
Tim Northovere0e3aef2013-01-31 12:12:40 +000088
David Blaikiea79ac142015-02-27 21:17:42 +000089 %oldval = load volatile i32, i32* %existing
Tim Northovere0e3aef2013-01-31 12:12:40 +000090 %oldval_keep = and i32 %oldval, 135 ; = 0x87
91
David Blaikiea79ac142015-02-27 21:17:42 +000092 %newval = load volatile i32, i32* %new
Tim Northovere0e3aef2013-01-31 12:12:40 +000093 %newval_shifted = shl i32 %newval, 3
94 %newval_masked = and i32 %newval_shifted, 120 ; = 0x78
95
96 %combined = or i32 %oldval_keep, %newval_masked
97 store volatile i32 %combined, i32* %existing
98
99 ret void
100}
101
; 64-bit insert with a partial keep mask: bits 32..39 of *%existing are kept
; and eight bits of *%new are placed at bit 40. The "or" operands are in the
; opposite order from the 32-bit variant (inserted value first). The expected
; output is an "and" followed by a bfi with lsb #40 and width #8.
102define void @test_64bit_masked(i64 *%existing, i64 *%new) {
Stephen Linf799e3f2013-07-13 20:38:47 +0000103; CHECK-LABEL: test_64bit_masked:
Tim Northover3b0846e2014-05-24 12:50:23 +0000104; CHECK: and
Tim Northover534acbd2014-05-01 12:29:38 +0000105; CHECK: bfi [[INSERT:x[0-9]+]], {{x[0-9]+}}, #40, #8
Tim Northovere0e3aef2013-01-31 12:12:40 +0000106
David Blaikiea79ac142015-02-27 21:17:42 +0000107 %oldval = load volatile i64, i64* %existing
Tim Northovere0e3aef2013-01-31 12:12:40 +0000108 %oldval_keep = and i64 %oldval, 1095216660480 ; = 0xff_0000_0000
109
David Blaikiea79ac142015-02-27 21:17:42 +0000110 %newval = load volatile i64, i64* %new
Tim Northovere0e3aef2013-01-31 12:12:40 +0000111 %newval_shifted = shl i64 %newval, 40
112 %newval_masked = and i64 %newval_shifted, 280375465082880 ; = 0xff00_0000_0000
113
114 %combined = or i64 %newval_masked, %oldval_keep
115 store volatile i64 %combined, i64* %existing
116
117 ret void
118}
119
120; Mask is too complicated for literal ANDwwi, make sure other avenues are tried.
; The keep mask 0x287 is not a single contiguous run of ones, while the insert
; mask 0x78 is. The expected output is still an "and" followed by a bfi with
; lsb #3 and width #4.
121define void @test_32bit_complexmask(i32 *%existing, i32 *%new) {
Stephen Linf799e3f2013-07-13 20:38:47 +0000122; CHECK-LABEL: test_32bit_complexmask:
Tim Northovereb6611e2014-04-24 12:11:53 +0000123
Tim Northover3b0846e2014-05-24 12:50:23 +0000124; CHECK: and
Tim Northover534acbd2014-05-01 12:29:38 +0000125; CHECK: bfi {{w[0-9]+}}, {{w[0-9]+}}, #3, #4
Tim Northovere0e3aef2013-01-31 12:12:40 +0000126
David Blaikiea79ac142015-02-27 21:17:42 +0000127 %oldval = load volatile i32, i32* %existing
Tim Northovere0e3aef2013-01-31 12:12:40 +0000128 %oldval_keep = and i32 %oldval, 647 ; = 0x287
129
David Blaikiea79ac142015-02-27 21:17:42 +0000130 %newval = load volatile i32, i32* %new
Tim Northovere0e3aef2013-01-31 12:12:40 +0000131 %newval_shifted = shl i32 %newval, 3
132 %newval_masked = and i32 %newval_shifted, 120 ; = 0x78
133
134 %combined = or i32 %oldval_keep, %newval_masked
135 store volatile i32 %combined, i32* %existing
136
137 ret void
138}
139
140; Neither mask is a contiguous set of 1s. BFI can't be used
; Negative test: the keep mask 0x87 and the insert mask 0x278 each contain a
; gap, so no bfi or bfm may appear before the ret.
141define void @test_32bit_badmask(i32 *%existing, i32 *%new) {
Stephen Linf799e3f2013-07-13 20:38:47 +0000142; CHECK-LABEL: test_32bit_badmask:
Tim Northovere0e3aef2013-01-31 12:12:40 +0000143; CHECK-NOT: bfi
Tim Northovereb6611e2014-04-24 12:11:53 +0000144; CHECK-NOT: bfm
Tim Northovere0e3aef2013-01-31 12:12:40 +0000145; CHECK: ret
146
David Blaikiea79ac142015-02-27 21:17:42 +0000147 %oldval = load volatile i32, i32* %existing
Tim Northovere0e3aef2013-01-31 12:12:40 +0000148 %oldval_keep = and i32 %oldval, 135 ; = 0x87
149
David Blaikiea79ac142015-02-27 21:17:42 +0000150 %newval = load volatile i32, i32* %new
Tim Northovere0e3aef2013-01-31 12:12:40 +0000151 %newval_shifted = shl i32 %newval, 3
152 %newval_masked = and i32 %newval_shifted, 632 ; = 0x278
153
154 %combined = or i32 %oldval_keep, %newval_masked
155 store volatile i32 %combined, i32* %existing
156
157 ret void
158}
159
160; Ditto
; 64-bit negative test: the keep mask 0x87 and the insert mask 0x298 each
; contain gaps, so no bfi or bfm may appear before the ret.
161define void @test_64bit_badmask(i64 *%existing, i64 *%new) {
Stephen Linf799e3f2013-07-13 20:38:47 +0000162; CHECK-LABEL: test_64bit_badmask:
Tim Northovere0e3aef2013-01-31 12:12:40 +0000163; CHECK-NOT: bfi
Tim Northovereb6611e2014-04-24 12:11:53 +0000164; CHECK-NOT: bfm
Tim Northovere0e3aef2013-01-31 12:12:40 +0000165; CHECK: ret
166
David Blaikiea79ac142015-02-27 21:17:42 +0000167 %oldval = load volatile i64, i64* %existing
Tim Northovere0e3aef2013-01-31 12:12:40 +0000168 %oldval_keep = and i64 %oldval, 135 ; = 0x87
169
David Blaikiea79ac142015-02-27 21:17:42 +0000170 %newval = load volatile i64, i64* %new
Tim Northovere0e3aef2013-01-31 12:12:40 +0000171 %newval_shifted = shl i64 %newval, 3
; NOTE(review): 664 is 0x298, which also overlaps the keep mask at bit 7; the
; 32-bit variant uses 632 (0x278). Confirm which constant was intended.
172 %newval_masked = and i64 %newval_shifted, 664 ; = 0x298
173
174 %combined = or i64 %oldval_keep, %newval_masked
175 store volatile i64 %combined, i64* %existing
176
177 ret void
178}
179
180; Bitfield insert where there's a left-over shr needed at the beginning
181; (e.g. result of str.bf1 = str.bf2)
; The new value is shifted left by only 12 but masked to bits 26..30
; (0x7c000000), so the inserted field comes from bits 14..18 of *%new. The
; expected output is an lsr by #14 whose result feeds a bfi with lsb #26 and
; width #5. Unlike the earlier tests, the load of %new is not volatile.
182define void @test_32bit_with_shr(i32* %existing, i32* %new) {
Stephen Linf799e3f2013-07-13 20:38:47 +0000183; CHECK-LABEL: test_32bit_with_shr:
Tim Northovere0e3aef2013-01-31 12:12:40 +0000184
David Blaikiea79ac142015-02-27 21:17:42 +0000185 %oldval = load volatile i32, i32* %existing
Tim Northovere0e3aef2013-01-31 12:12:40 +0000186 %oldval_keep = and i32 %oldval, 2214592511 ; =0x83ffffff
187
David Blaikiea79ac142015-02-27 21:17:42 +0000188 %newval = load i32, i32* %new
Tim Northovere0e3aef2013-01-31 12:12:40 +0000189 %newval_shifted = shl i32 %newval, 12
190 %newval_masked = and i32 %newval_shifted, 2080374784 ; = 0x7c000000
191
192 %combined = or i32 %oldval_keep, %newval_masked
193 store volatile i32 %combined, i32* %existing
194; CHECK: lsr [[BIT:w[0-9]+]], {{w[0-9]+}}, #14
Tim Northover534acbd2014-05-01 12:29:38 +0000195; CHECK: bfi {{w[0-9]+}}, [[BIT]], #26, #5
Tim Northovere0e3aef2013-01-31 12:12:40 +0000196
197 ret void
198}
Geoff Berry43ec15e2015-09-18 17:11:53 +0000199
200; Bitfield insert where the second or operand is a better match to be folded into the BFM
; The first "or" operand is a plain 0xffff mask of the old value; the second
; is (*%new << 16) & 0x00ff0000. The expected output is an "and" with #0xffff
; whose result register is the destination of a bfi with lsb #16 and width #8,
; i.e. the shifted second operand is the one folded into the insert.
201define void @test_32bit_opnd1_better(i32* %existing, i32* %new) {
202; CHECK-LABEL: test_32bit_opnd1_better:
203
204 %oldval = load volatile i32, i32* %existing
205 %oldval_keep = and i32 %oldval, 65535 ; 0x0000ffff
206
207 %newval = load i32, i32* %new
208 %newval_shifted = shl i32 %newval, 16
209 %newval_masked = and i32 %newval_shifted, 16711680 ; 0x00ff0000
210
211 %combined = or i32 %oldval_keep, %newval_masked
212 store volatile i32 %combined, i32* %existing
213; CHECK: and [[BIT:w[0-9]+]], {{w[0-9]+}}, #0xffff
214; CHECK: bfi [[BIT]], {{w[0-9]+}}, #16, #8
215
216 ret void
217}
Weiming Zhao56ab5182015-12-01 19:17:49 +0000218
219; Tests when all the bits from one operand are not useful
; Builds a word by repeatedly shifting left by 8 and or-ing in the
; zero-extended byte %a; after four rounds every byte of %b has been shifted
; out. The trailing comments track the byte lanes from most to least
; significant. The expected output is exactly three bfi instructions, then no
; further bfi and no "or" before the final lsl.
220define i32 @test_nouseful_bits(i8 %a, i32 %b) {
221; CHECK-LABEL: test_nouseful_bits:
222; CHECK: bfi
223; CHECK: bfi
224; CHECK: bfi
225; CHECK-NOT: bfi
226; CHECK-NOT: or
227; CHECK: lsl
228 %conv = zext i8 %a to i32 ; 0 0 0 A
229 %shl = shl i32 %b, 8 ; B2 B1 B0 0
230 %or = or i32 %conv, %shl ; B2 B1 B0 A
231 %shl.1 = shl i32 %or, 8 ; B1 B0 A 0
232 %or.1 = or i32 %conv, %shl.1 ; B1 B0 A A
233 %shl.2 = shl i32 %or.1, 8 ; B0 A A 0
234 %or.2 = or i32 %conv, %shl.2 ; B0 A A A
235 %shl.3 = shl i32 %or.2, 8 ; A A A 0
236 %or.3 = or i32 %conv, %shl.3 ; A A A A
237 %shl.4 = shl i32 %or.3, 8 ; A A A 0
238 ret i32 %shl.4
239}