; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -verify-machineinstrs -mcpu=pwr8 < %s | FileCheck %s
target datalayout = "e-m:e-i64:64-n32:64"
target triple = "powerpc64le-unknown-linux-gnu"

; Constant i32 buffers. Each buffer1/buffer2 pair differs in exactly one
; element.
@zeroEqualityTest01.buffer1 = private unnamed_addr constant [3 x i32] [i32 1, i32 2, i32 4], align 4
@zeroEqualityTest01.buffer2 = private unnamed_addr constant [3 x i32] [i32 1, i32 2, i32 3], align 4
@zeroEqualityTest02.buffer1 = private unnamed_addr constant [4 x i32] [i32 4, i32 0, i32 0, i32 0], align 4
@zeroEqualityTest02.buffer2 = private unnamed_addr constant [4 x i32] [i32 3, i32 0, i32 0, i32 0], align 4
@zeroEqualityTest03.buffer1 = private unnamed_addr constant [4 x i32] [i32 0, i32 0, i32 0, i32 3], align 4
@zeroEqualityTest03.buffer2 = private unnamed_addr constant [4 x i32] [i32 0, i32 0, i32 0, i32 4], align 4
@zeroEqualityTest04.buffer1 = private unnamed_addr constant [15 x i32] [i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14], align 4
@zeroEqualityTest04.buffer2 = private unnamed_addr constant [15 x i32] [i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 13], align 4

; External memcmp; every test in this file calls it with a constant length.
declare signext i32 @memcmp(i8* nocapture, i8* nocapture, i64) local_unnamed_addr #1

; Check 4 bytes - requires 1 load for each param.
; The memcmp result is only tested against zero (icmp ne), and the expected
; code is branch-free: one word load per operand, xor, then reduce to 0/1.
define signext i32 @zeroEqualityTest02(i8* %x, i8* %y) {
; CHECK-LABEL: zeroEqualityTest02:
; CHECK:       # BB#0:
; CHECK-NEXT:    lwz 3, 0(3)
; CHECK-NEXT:    lwz 4, 0(4)
; CHECK-NEXT:    xor 3, 3, 4
; CHECK-NEXT:    cntlzw 3, 3
; CHECK-NEXT:    srwi 3, 3, 5
; CHECK-NEXT:    xori 3, 3, 1
; CHECK-NEXT:    blr
  %call = tail call signext i32 @memcmp(i8* %x, i8* %y, i64 4)
  %not.cmp = icmp ne i32 %call, 0
  %. = zext i1 %not.cmp to i32
  ret i32 %.
}

; Check 16 bytes - requires 2 loads for each param (or use vectors?).
; The result is only tested against zero (icmp ne). The expected code compares
; the doublewords at offsets 0 and 8, branching to %res_block (result 1) on the
; first mismatch and producing 0 when both pairs match.
define signext i32 @zeroEqualityTest01(i8* %x, i8* %y) {
; CHECK-LABEL: zeroEqualityTest01:
; CHECK:       # BB#0: # %loadbb
; CHECK-NEXT:    ld 5, 0(3)
; CHECK-NEXT:    ld 6, 0(4)
; CHECK-NEXT:    cmpld 5, 6
; CHECK-NEXT:    bne 0, .LBB1_2
; CHECK-NEXT:  # BB#1: # %loadbb1
; CHECK-NEXT:    ld 3, 8(3)
; CHECK-NEXT:    ld 4, 8(4)
; CHECK-NEXT:    cmpld 3, 4
; CHECK-NEXT:    li 3, 0
; CHECK-NEXT:    beq 0, .LBB1_3
; CHECK-NEXT:  .LBB1_2: # %res_block
; CHECK-NEXT:    li 3, 1
; CHECK-NEXT:    clrldi 3, 3, 32
; CHECK-NEXT:    blr
; CHECK-NEXT:  .LBB1_3: # %endblock
; CHECK-NEXT:    clrldi 3, 3, 32
; CHECK-NEXT:    blr
  %call = tail call signext i32 @memcmp(i8* %x, i8* %y, i64 16)
  %not.tobool = icmp ne i32 %call, 0
  %. = zext i1 %not.tobool to i32
  ret i32 %.
}

; Check 7 bytes - requires 3 loads for each param.
; The result is only tested against zero (icmp ne). The expected code covers
; the 7 bytes with a word load at offset 0, a halfword load at offset 4 and a
; byte load at offset 6, branching to %res_block (result 1) on any mismatch.
define signext i32 @zeroEqualityTest03(i8* %x, i8* %y) {
; CHECK-LABEL: zeroEqualityTest03:
; CHECK:       # BB#0: # %loadbb
; CHECK-NEXT:    lwz 5, 0(3)
; CHECK-NEXT:    lwz 6, 0(4)
; CHECK-NEXT:    cmplw 5, 6
; CHECK-NEXT:    bne 0, .LBB2_3
; CHECK-NEXT:  # BB#1: # %loadbb1
; CHECK-NEXT:    lhz 5, 4(3)
; CHECK-NEXT:    lhz 6, 4(4)
; CHECK-NEXT:    cmplw 5, 6
; CHECK-NEXT:    bne 0, .LBB2_3
; CHECK-NEXT:  # BB#2: # %loadbb2
; CHECK-NEXT:    lbz 3, 6(3)
; CHECK-NEXT:    lbz 4, 6(4)
; CHECK-NEXT:    cmplw 3, 4
; CHECK-NEXT:    li 3, 0
; CHECK-NEXT:    beq 0, .LBB2_4
; CHECK-NEXT:  .LBB2_3: # %res_block
; CHECK-NEXT:    li 3, 1
; CHECK-NEXT:    clrldi 3, 3, 32
; CHECK-NEXT:    blr
; CHECK-NEXT:  .LBB2_4: # %endblock
; CHECK-NEXT:    clrldi 3, 3, 32
; CHECK-NEXT:    blr
  %call = tail call signext i32 @memcmp(i8* %x, i8* %y, i64 7)
  %not.lnot = icmp ne i32 %call, 0
  %cond = zext i1 %not.lnot to i32
  ret i32 %cond
}

; Validate with > 0
; The memcmp result is tested with "icmp slt %call, 1", i.e. the function
; returns 1 when the result is NOT greater than zero. This is not a
; zero-equality test, so the expected code uses byte-reversed doubleword loads
; (ldbrx) and materializes a -1/1 result in %res_block via isel.
; Note: the operands are the 16-byte @zeroEqualityTest02.buffer1/buffer2
; globals.
define signext i32 @zeroEqualityTest04() {
; CHECK-LABEL: zeroEqualityTest04:
; CHECK:       # BB#0: # %loadbb
; CHECK-NEXT:    addis 3, 2, .LzeroEqualityTest02.buffer1@toc@ha
; CHECK-NEXT:    addis 4, 2, .LzeroEqualityTest02.buffer2@toc@ha
; CHECK-NEXT:    addi 6, 3, .LzeroEqualityTest02.buffer1@toc@l
; CHECK-NEXT:    addi 5, 4, .LzeroEqualityTest02.buffer2@toc@l
; CHECK-NEXT:    ldbrx 3, 0, 6
; CHECK-NEXT:    ldbrx 4, 0, 5
; CHECK-NEXT:    subf. 7, 4, 3
; CHECK-NEXT:    bne 0, .LBB3_2
; CHECK-NEXT:  # BB#1: # %loadbb1
; CHECK-NEXT:    li 4, 8
; CHECK-NEXT:    ldbrx 3, 6, 4
; CHECK-NEXT:    ldbrx 4, 5, 4
; CHECK-NEXT:    subf. 5, 4, 3
; CHECK-NEXT:    beq 0, .LBB3_4
; CHECK-NEXT:  .LBB3_2: # %res_block
; CHECK-NEXT:    cmpld 3, 4
; CHECK-NEXT:    li 3, 1
; CHECK-NEXT:    li 12, -1
; CHECK-NEXT:    isel 3, 12, 3, 0
; CHECK-NEXT:  .LBB3_3: # %endblock
; CHECK-NEXT:    cmpwi 3, 1
; CHECK-NEXT:    li 3, 0
; CHECK-NEXT:    li 4, 1
; CHECK-NEXT:    isel 3, 4, 3, 0
; CHECK-NEXT:    blr
; CHECK-NEXT:  .LBB3_4:
; CHECK-NEXT:    li 3, 0
; CHECK-NEXT:    b .LBB3_3
  %call = tail call signext i32 @memcmp(i8* bitcast ([4 x i32]* @zeroEqualityTest02.buffer1 to i8*), i8* bitcast ([4 x i32]* @zeroEqualityTest02.buffer2 to i8*), i64 16)
  %not.cmp = icmp slt i32 %call, 1
  %. = zext i1 %not.cmp to i32
  ret i32 %.
}

; Validate with < 0
; The IR extracts the sign bit of the memcmp result (lshr 31) and inverts it
; (xor 1), i.e. the function returns 1 when the result is NOT negative. As this
; is not a zero-equality test, the expected code uses byte-reversed doubleword
; loads (ldbrx) and materializes a -1/1 result in %res_block via isel.
; Note: the operands are the 16-byte @zeroEqualityTest03.buffer1/buffer2
; globals.
define signext i32 @zeroEqualityTest05() {
; CHECK-LABEL: zeroEqualityTest05:
; CHECK:       # BB#0: # %loadbb
; CHECK-NEXT:    addis 3, 2, .LzeroEqualityTest03.buffer1@toc@ha
; CHECK-NEXT:    addis 4, 2, .LzeroEqualityTest03.buffer2@toc@ha
; CHECK-NEXT:    addi 6, 3, .LzeroEqualityTest03.buffer1@toc@l
; CHECK-NEXT:    addi 5, 4, .LzeroEqualityTest03.buffer2@toc@l
; CHECK-NEXT:    ldbrx 3, 0, 6
; CHECK-NEXT:    ldbrx 4, 0, 5
; CHECK-NEXT:    subf. 7, 4, 3
; CHECK-NEXT:    bne 0, .LBB4_2
; CHECK-NEXT:  # BB#1: # %loadbb1
; CHECK-NEXT:    li 4, 8
; CHECK-NEXT:    ldbrx 3, 6, 4
; CHECK-NEXT:    ldbrx 4, 5, 4
; CHECK-NEXT:    subf. 5, 4, 3
; CHECK-NEXT:    beq 0, .LBB4_4
; CHECK-NEXT:  .LBB4_2: # %res_block
; CHECK-NEXT:    cmpld 3, 4
; CHECK-NEXT:    li 3, 1
; CHECK-NEXT:    li 12, -1
; CHECK-NEXT:    isel 3, 12, 3, 0
; CHECK-NEXT:  .LBB4_3: # %endblock
; CHECK-NEXT:    srwi 3, 3, 31
; CHECK-NEXT:    xori 3, 3, 1
; CHECK-NEXT:    clrldi 3, 3, 32
; CHECK-NEXT:    blr
; CHECK-NEXT:  .LBB4_4:
; CHECK-NEXT:    li 3, 0
; CHECK-NEXT:    b .LBB4_3
  %call = tail call signext i32 @memcmp(i8* bitcast ([4 x i32]* @zeroEqualityTest03.buffer1 to i8*), i8* bitcast ([4 x i32]* @zeroEqualityTest03.buffer2 to i8*), i64 16)
  %call.lobit = lshr i32 %call, 31
  %call.lobit.not = xor i32 %call.lobit, 1
  ret i32 %call.lobit.not
}

; Validate with memcmp() ? 0 : 1 where both operands are constants.
; The first 16 bytes of @zeroEqualityTest04.buffer1 and .buffer2 are identical
; (i32 0, 1, 2, 3), so the "== 0" test is expected to fold to the constant 1
; with no loads or compares emitted.
define signext i32 @equalityFoldTwoConstants() {
; CHECK-LABEL: equalityFoldTwoConstants:
; CHECK:       # BB#0: # %endblock
; CHECK-NEXT:    li 3, 1
; CHECK-NEXT:    blr
  %call = tail call signext i32 @memcmp(i8* bitcast ([15 x i32]* @zeroEqualityTest04.buffer1 to i8*), i8* bitcast ([15 x i32]* @zeroEqualityTest04.buffer2 to i8*), i64 16)
  %not.tobool = icmp eq i32 %call, 0
  %cond = zext i1 %not.tobool to i32
  ret i32 %cond
}

; Zero-equality memcmp of 16 bytes where only the first operand is a constant
; (@zeroEqualityTest04.buffer1). The expected code does not load from the
; constant buffer: its two doublewords are built as immediates (li/sldi/ori)
; and compared against the doublewords loaded from %X.
define signext i32 @equalityFoldOneConstant(i8* %X) {
; CHECK-LABEL: equalityFoldOneConstant:
; CHECK:       # BB#0: # %loadbb
; CHECK-NEXT:    li 4, 1
; CHECK-NEXT:    ld 5, 0(3)
; CHECK-NEXT:    sldi 4, 4, 32
; CHECK-NEXT:    cmpld 5, 4
; CHECK-NEXT:    bne 0, .LBB6_2
; CHECK-NEXT:  # BB#1: # %loadbb1
; CHECK-NEXT:    li 4, 3
; CHECK-NEXT:    ld 3, 8(3)
; CHECK-NEXT:    sldi 4, 4, 32
; CHECK-NEXT:    ori 4, 4, 2
; CHECK-NEXT:    cmpld 3, 4
; CHECK-NEXT:    li 3, 0
; CHECK-NEXT:    beq 0, .LBB6_3
; CHECK-NEXT:  .LBB6_2: # %res_block
; CHECK-NEXT:    li 3, 1
; CHECK-NEXT:  .LBB6_3: # %endblock
; CHECK-NEXT:    cntlzw 3, 3
; CHECK-NEXT:    srwi 3, 3, 5
; CHECK-NEXT:    blr
  %call = tail call signext i32 @memcmp(i8* bitcast ([15 x i32]* @zeroEqualityTest04.buffer1 to i8*), i8* %X, i64 16)
  %not.tobool = icmp eq i32 %call, 0
  %cond = zext i1 %not.tobool to i32
  ret i32 %cond
}

; Zero-equality memcmp of 2 bytes where the call site is marked nobuiltin.
; The expected code keeps a real call ("bl memcmp") with the length passed in
; r5, instead of expanding the comparison inline as in the tests above.
define i1 @length2_eq_nobuiltin_attr(i8* %X, i8* %Y) {
; CHECK-LABEL: length2_eq_nobuiltin_attr:
; CHECK:       # BB#0:
; CHECK-NEXT:    mflr 0
; CHECK-NEXT:    std 0, 16(1)
; CHECK-NEXT:    stdu 1, -32(1)
; CHECK-NEXT:  .Lcfi0:
; CHECK-NEXT:    .cfi_def_cfa_offset 32
; CHECK-NEXT:  .Lcfi1:
; CHECK-NEXT:    .cfi_offset lr, 16
; CHECK-NEXT:    li 5, 2
; CHECK-NEXT:    bl memcmp
; CHECK-NEXT:    nop
; CHECK-NEXT:    cntlzw 3, 3
; CHECK-NEXT:    rlwinm 3, 3, 27, 31, 31
; CHECK-NEXT:    addi 1, 1, 32
; CHECK-NEXT:    ld 0, 16(1)
; CHECK-NEXT:    mtlr 0
; CHECK-NEXT:    blr
  %m = tail call signext i32 @memcmp(i8* %X, i8* %Y, i64 2) nobuiltin
  %c = icmp eq i32 %m, 0
  ret i1 %c
}