; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -verify-machineinstrs -mcpu=pwr8 < %s | FileCheck %s
target datalayout = "e-m:e-i64:64-n32:64"
target triple = "powerpc64le-unknown-linux-gnu"

; Constant buffers handed to memcmp by the argument-less tests in this file.
; The name prefixes do not line up with the functions that use them:
;   @zeroEqualityTest02.buffer{1,2} are read by @zeroEqualityTest04,
;   @zeroEqualityTest03.buffer{1,2} are read by @zeroEqualityTest05,
;   @zeroEqualityTest04.buffer{1,2} are read by @zeroEqualityTest06.
; @zeroEqualityTest01.buffer{1,2} are not referenced by any function visible
; in this part of the file. The symbol names appear in the autogenerated
; assertions, so renaming them requires regenerating those assertions.
@zeroEqualityTest01.buffer1 = private unnamed_addr constant [3 x i32] [i32 1, i32 2, i32 4], align 4
@zeroEqualityTest01.buffer2 = private unnamed_addr constant [3 x i32] [i32 1, i32 2, i32 3], align 4
@zeroEqualityTest02.buffer1 = private unnamed_addr constant [4 x i32] [i32 4, i32 0, i32 0, i32 0], align 4
@zeroEqualityTest02.buffer2 = private unnamed_addr constant [4 x i32] [i32 3, i32 0, i32 0, i32 0], align 4
@zeroEqualityTest03.buffer1 = private unnamed_addr constant [4 x i32] [i32 0, i32 0, i32 0, i32 3], align 4
@zeroEqualityTest03.buffer2 = private unnamed_addr constant [4 x i32] [i32 0, i32 0, i32 0, i32 4], align 4
@zeroEqualityTest04.buffer1 = private unnamed_addr constant [15 x i32] [i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14], align 4
@zeroEqualityTest04.buffer2 = private unnamed_addr constant [15 x i32] [i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 13], align 4

; External memcmp; every test below calls it with a constant length.
; NOTE(review): attribute group #1 is not defined in the portion of the file
; visible here - confirm it is defined elsewhere or intentionally left empty.
declare signext i32 @memcmp(i8* nocapture, i8* nocapture, i64) local_unnamed_addr #1

; Check 4 bytes - requires 1 load for each param.
; The memcmp result is only compared against zero: the function returns 1
; when the result is non-zero and 0 otherwise. The assertions below expect a
; single word load (lwz) from each pointer followed by an xor, with no call.
define signext i32 @zeroEqualityTest02(i8* %x, i8* %y) {
; CHECK-LABEL: zeroEqualityTest02:
; CHECK: # BB#0: # %loadbb
; CHECK-NEXT: lwz 3, 0(3)
; CHECK-NEXT: lwz 4, 0(4)
; CHECK-NEXT: li 5, 1
; CHECK-NEXT: xor 3, 3, 4
; CHECK-NEXT: cmplwi 3, 0
; CHECK-NEXT: isel 3, 0, 5, 2
; CHECK-NEXT: clrldi 3, 3, 32
; CHECK-NEXT: blr
  %call = tail call signext i32 @memcmp(i8* %x, i8* %y, i64 4)
  %not.cmp = icmp ne i32 %call, 0
  %. = zext i1 %not.cmp to i32
  ret i32 %.
}

; Check 16 bytes - requires 2 loads for each param (or use vectors?).
; Returns 1 when the memcmp result is non-zero and 0 otherwise. The
; assertions below expect two doubleword loads (ld) per pointer, at offsets 0
; and 8, with a branch to %res_block as soon as the first pair differs.
define signext i32 @zeroEqualityTest01(i8* %x, i8* %y) {
; CHECK-LABEL: zeroEqualityTest01:
; CHECK: # BB#0: # %loadbb
; CHECK-NEXT: ld 5, 0(3)
; CHECK-NEXT: ld 6, 0(4)
; CHECK-NEXT: xor. 5, 5, 6
; CHECK-NEXT: bne 0, .LBB1_2
; CHECK-NEXT: # BB#1: # %loadbb1
; CHECK-NEXT: ld 3, 8(3)
; CHECK-NEXT: ld 4, 8(4)
; CHECK-NEXT: xor. 3, 3, 4
; CHECK-NEXT: beq 0, .LBB1_3
; CHECK-NEXT: .LBB1_2: # %res_block
; CHECK-NEXT: li 3, 1
; CHECK-NEXT: clrldi 3, 3, 32
; CHECK-NEXT: blr
; CHECK-NEXT: .LBB1_3:
; CHECK-NEXT: li 3, 0
; CHECK-NEXT: clrldi 3, 3, 32
; CHECK-NEXT: blr
  %call = tail call signext i32 @memcmp(i8* %x, i8* %y, i64 16)
  %not.tobool = icmp ne i32 %call, 0
  %. = zext i1 %not.tobool to i32
  ret i32 %.
}

; Check 7 bytes - requires 3 loads for each param.
; Returns 1 when the memcmp result is non-zero and 0 otherwise. The
; assertions below expect the 7 bytes to be split into a word load at offset
; 0 (lwz), a halfword load at offset 4 (lhz) and a byte load at offset 6
; (lbz), branching to %res_block on the first pair that differs.
define signext i32 @zeroEqualityTest03(i8* %x, i8* %y) {
; CHECK-LABEL: zeroEqualityTest03:
; CHECK: # BB#0: # %loadbb
; CHECK-NEXT: lwz 5, 0(3)
; CHECK-NEXT: lwz 6, 0(4)
; CHECK-NEXT: xor 5, 5, 6
; CHECK-NEXT: cmplwi 5, 0
; CHECK-NEXT: bne 0, .LBB2_3
; CHECK-NEXT: # BB#1: # %loadbb1
; CHECK-NEXT: lhz 5, 4(3)
; CHECK-NEXT: lhz 6, 4(4)
; CHECK-NEXT: xor 5, 5, 6
; CHECK-NEXT: rlwinm. 5, 5, 0, 16, 31
; CHECK-NEXT: bne 0, .LBB2_3
; CHECK-NEXT: # BB#2: # %loadbb2
; CHECK-NEXT: lbz 3, 6(3)
; CHECK-NEXT: lbz 4, 6(4)
; CHECK-NEXT: xor 3, 3, 4
; CHECK-NEXT: rlwinm. 3, 3, 0, 24, 31
; CHECK-NEXT: beq 0, .LBB2_4
; CHECK-NEXT: .LBB2_3: # %res_block
; CHECK-NEXT: li 3, 1
; CHECK-NEXT: clrldi 3, 3, 32
; CHECK-NEXT: blr
; CHECK-NEXT: .LBB2_4:
; CHECK-NEXT: li 3, 0
; CHECK-NEXT: clrldi 3, 3, 32
; CHECK-NEXT: blr
  %call = tail call signext i32 @memcmp(i8* %x, i8* %y, i64 7)
  %not.lnot = icmp ne i32 %call, 0
  %cond = zext i1 %not.lnot to i32
  ret i32 %cond
}

; Validate with > 0
; The result is tested with `icmp slt %call, 1`, so the function returns 1
; when memcmp's result is <= 0 and 0 when it is > 0. Because the sign of the
; result matters here, the assertions below expect byte-reversed doubleword
; loads (ldbrx) and an unsigned compare (cmpld) that materialises -1 or 1,
; rather than the plain xor used by the equality-only tests.
; Note: the buffers compared are @zeroEqualityTest02.buffer{1,2} (16 bytes
; each); their name prefix does not match this function's number.
define signext i32 @zeroEqualityTest04() {
; CHECK-LABEL: zeroEqualityTest04:
; CHECK: # BB#0: # %loadbb
; CHECK-NEXT: addis 3, 2, .LzeroEqualityTest02.buffer1@toc@ha
; CHECK-NEXT: addis 4, 2, .LzeroEqualityTest02.buffer2@toc@ha
; CHECK-NEXT: addi 6, 3, .LzeroEqualityTest02.buffer1@toc@l
; CHECK-NEXT: addi 5, 4, .LzeroEqualityTest02.buffer2@toc@l
; CHECK-NEXT: ldbrx 3, 0, 6
; CHECK-NEXT: ldbrx 4, 0, 5
; CHECK-NEXT: subf. 7, 4, 3
; CHECK-NEXT: bne 0, .LBB3_2
; CHECK-NEXT: # BB#1: # %loadbb1
; CHECK-NEXT: li 4, 8
; CHECK-NEXT: ldbrx 3, 6, 4
; CHECK-NEXT: ldbrx 4, 5, 4
; CHECK-NEXT: subf. 5, 4, 3
; CHECK-NEXT: beq 0, .LBB3_4
; CHECK-NEXT: .LBB3_2: # %res_block
; CHECK-NEXT: cmpld 3, 4
; CHECK-NEXT: li 3, 1
; CHECK-NEXT: li 12, -1
; CHECK-NEXT: isel 3, 12, 3, 0
; CHECK-NEXT: .LBB3_3: # %endblock
; CHECK-NEXT: cmpwi 3, 1
; CHECK-NEXT: li 3, 0
; CHECK-NEXT: li 4, 1
; CHECK-NEXT: isel 3, 4, 3, 0
; CHECK-NEXT: blr
; CHECK-NEXT: .LBB3_4:
; CHECK-NEXT: li 3, 0
; CHECK-NEXT: b .LBB3_3
  %call = tail call signext i32 @memcmp(i8* bitcast ([4 x i32]* @zeroEqualityTest02.buffer1 to i8*), i8* bitcast ([4 x i32]* @zeroEqualityTest02.buffer2 to i8*), i64 16)
  %not.cmp = icmp slt i32 %call, 1
  %. = zext i1 %not.cmp to i32
  ret i32 %.
}

135; Validate with < 0
Sanjay Patel7a522962017-06-06 22:06:07 +0000136define signext i32 @zeroEqualityTest05() {
137; CHECK-LABEL: zeroEqualityTest05:
138; CHECK: # BB#0: # %loadbb
139; CHECK-NEXT: addis 3, 2, .LzeroEqualityTest03.buffer1@toc@ha
140; CHECK-NEXT: addis 4, 2, .LzeroEqualityTest03.buffer2@toc@ha
141; CHECK-NEXT: addi 6, 3, .LzeroEqualityTest03.buffer1@toc@l
142; CHECK-NEXT: addi 5, 4, .LzeroEqualityTest03.buffer2@toc@l
143; CHECK-NEXT: ldbrx 3, 0, 6
144; CHECK-NEXT: ldbrx 4, 0, 5
145; CHECK-NEXT: subf. 7, 4, 3
146; CHECK-NEXT: bne 0, .LBB4_2
147; CHECK-NEXT: # BB#1: # %loadbb1
148; CHECK-NEXT: li 4, 8
149; CHECK-NEXT: ldbrx 3, 6, 4
150; CHECK-NEXT: ldbrx 4, 5, 4
151; CHECK-NEXT: subf. 5, 4, 3
152; CHECK-NEXT: beq 0, .LBB4_4
153; CHECK-NEXT: .LBB4_2: # %res_block
154; CHECK-NEXT: cmpld 3, 4
155; CHECK-NEXT: li 3, 1
156; CHECK-NEXT: li 12, -1
157; CHECK-NEXT: isel 3, 12, 3, 0
158; CHECK-NEXT: .LBB4_3: # %endblock
159; CHECK-NEXT: srwi 3, 3, 31
160; CHECK-NEXT: xori 3, 3, 1
161; CHECK-NEXT: clrldi 3, 3, 32
162; CHECK-NEXT: blr
163; CHECK-NEXT: .LBB4_4:
164; CHECK-NEXT: li 3, 0
165; CHECK-NEXT: b .LBB4_3
Zaara Syeda3a7578c2017-05-31 17:12:38 +0000166 %call = tail call signext i32 @memcmp(i8* bitcast ([4 x i32]* @zeroEqualityTest03.buffer1 to i8*), i8* bitcast ([4 x i32]* @zeroEqualityTest03.buffer2 to i8*), i64 16)
167 %call.lobit = lshr i32 %call, 31
168 %call.lobit.not = xor i32 %call.lobit, 1
169 ret i32 %call.lobit.not
Zaara Syeda3a7578c2017-05-31 17:12:38 +0000170}
171
; Validate with memcmp()?:
; The result is tested with `icmp eq %call, 0`, so the function returns 1
; when memcmp reports equality and 0 otherwise. Only equality is needed, so
; the assertions below expect plain doubleword loads (ld) combined with xor.
; Note: the buffers compared are @zeroEqualityTest04.buffer{1,2}, which are
; [15 x i32] (60 bytes); the call passes a length of 16, so only their first
; 16 bytes take part in the comparison.
define signext i32 @zeroEqualityTest06() {
; CHECK-LABEL: zeroEqualityTest06:
; CHECK: # BB#0: # %loadbb
; CHECK-NEXT: addis 3, 2, .LzeroEqualityTest04.buffer1@toc@ha
; CHECK-NEXT: addis 4, 2, .LzeroEqualityTest04.buffer2@toc@ha
; CHECK-NEXT: ld 3, .LzeroEqualityTest04.buffer1@toc@l(3)
; CHECK-NEXT: ld 4, .LzeroEqualityTest04.buffer2@toc@l(4)
; CHECK-NEXT: xor. 3, 3, 4
; CHECK-NEXT: bne 0, .LBB5_2
; CHECK-NEXT: # BB#1: # %loadbb1
; CHECK-NEXT: addis 3, 2, .LzeroEqualityTest04.buffer1@toc@ha+8
; CHECK-NEXT: addis 4, 2, .LzeroEqualityTest04.buffer2@toc@ha+8
; CHECK-NEXT: ld 3, .LzeroEqualityTest04.buffer1@toc@l+8(3)
; CHECK-NEXT: ld 4, .LzeroEqualityTest04.buffer2@toc@l+8(4)
; CHECK-NEXT: xor. 3, 3, 4
; CHECK-NEXT: beq 0, .LBB5_4
; CHECK-NEXT: .LBB5_2: # %res_block
; CHECK-NEXT: li 3, 1
; CHECK-NEXT: .LBB5_3: # %endblock
; CHECK-NEXT: cntlzw 3, 3
; CHECK-NEXT: srwi 3, 3, 5
; CHECK-NEXT: blr
; CHECK-NEXT: .LBB5_4:
; CHECK-NEXT: li 3, 0
; CHECK-NEXT: b .LBB5_3
  %call = tail call signext i32 @memcmp(i8* bitcast ([15 x i32]* @zeroEqualityTest04.buffer1 to i8*), i8* bitcast ([15 x i32]* @zeroEqualityTest04.buffer2 to i8*), i64 16)
  %not.tobool = icmp eq i32 %call, 0
  %cond = zext i1 %not.tobool to i32
  ret i32 %cond
}
