; blob: 27e9c1b8819d85f1c1eef4a55e64311fdac97655
; XFAIL: *
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -verify-machineinstrs -mcpu=pwr8 < %s | FileCheck %s
;
; Codegen test for memcmp calls with a constant length, compiled by llc for
; powerpc64le with -mcpu=pwr8. Each function pins the exact assembly expected
; for one call shape. The expected-failure directive on the first line marks
; the whole file as expected to fail.
target datalayout = "e-m:e-i64:64-n32:64"
target triple = "powerpc64le-unknown-linux-gnu"

; Constant buffers used as memcmp operands. The buffer names do not line up
; with the functions that read them: zeroEqualityTest04 reads the
; zeroEqualityTest02 buffers, zeroEqualityTest05 reads the zeroEqualityTest03
; buffers, and the equalityFold* functions read the zeroEqualityTest04 buffers.
; NOTE(review): the zeroEqualityTest01 buffers are not referenced by any
; function in the part of the file reviewed here - confirm before removing.
@zeroEqualityTest01.buffer1 = private unnamed_addr constant [3 x i32] [i32 1, i32 2, i32 4], align 4
@zeroEqualityTest01.buffer2 = private unnamed_addr constant [3 x i32] [i32 1, i32 2, i32 3], align 4
@zeroEqualityTest02.buffer1 = private unnamed_addr constant [4 x i32] [i32 4, i32 0, i32 0, i32 0], align 4
@zeroEqualityTest02.buffer2 = private unnamed_addr constant [4 x i32] [i32 3, i32 0, i32 0, i32 0], align 4
@zeroEqualityTest03.buffer1 = private unnamed_addr constant [4 x i32] [i32 0, i32 0, i32 0, i32 3], align 4
@zeroEqualityTest03.buffer2 = private unnamed_addr constant [4 x i32] [i32 0, i32 0, i32 0, i32 4], align 4
@zeroEqualityTest04.buffer1 = private unnamed_addr constant [15 x i32] [i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14], align 4
@zeroEqualityTest04.buffer2 = private unnamed_addr constant [15 x i32] [i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 13], align 4

; External memcmp called by every test function below.
; NOTE(review): attribute group #1 has no definition in the part of the file
; reviewed here - confirm whether one exists further down.
declare signext i32 @memcmp(i8* nocapture, i8* nocapture, i64) local_unnamed_addr #1

; Check 4 bytes - requires 1 load for each param.
; The memcmp result is only tested against zero (icmp ne), so the function
; returns 1 when the two 4-byte regions differ and 0 when they match.
; Expected code has no call: one lwz per pointer, an xor of the two words,
; then cntlzw/srwi/xori to turn "xor is non-zero" into 0 or 1.
define signext i32 @zeroEqualityTest02(i8* %x, i8* %y) {
; CHECK-LABEL: zeroEqualityTest02:
; CHECK: # BB#0:
; CHECK-NEXT: lwz 3, 0(3)
; CHECK-NEXT: lwz 4, 0(4)
; CHECK-NEXT: xor 3, 3, 4
; CHECK-NEXT: cntlzw 3, 3
; CHECK-NEXT: srwi 3, 3, 5
; CHECK-NEXT: xori 3, 3, 1
; CHECK-NEXT: blr
  %call = tail call signext i32 @memcmp(i8* %x, i8* %y, i64 4)
  %not.cmp = icmp ne i32 %call, 0
  %. = zext i1 %not.cmp to i32
  ret i32 %.
}

; Check 16 bytes - requires 2 loads for each param (or use vectors?).
; Only inequality with zero is tested, so the function returns 1 when the two
; 16-byte regions differ and 0 when they match.
; Expected code: compare the first doubleword of each operand (ld/cmpld) and
; branch to res_block on a mismatch; otherwise compare the doublewords at
; offset 8, preload 0 and return early (beqlr) when they are equal. res_block
; returns 1.
define signext i32 @zeroEqualityTest01(i8* %x, i8* %y) {
; CHECK-LABEL: zeroEqualityTest01:
; CHECK: # BB#0: # %loadbb
; CHECK-NEXT: ld 5, 0(3)
; CHECK-NEXT: ld 6, 0(4)
; CHECK-NEXT: cmpld 5, 6
; CHECK-NEXT: bne 0, .LBB1_2
; CHECK-NEXT: # BB#1: # %loadbb1
; CHECK-NEXT: ld 3, 8(3)
; CHECK-NEXT: ld 4, 8(4)
; CHECK-NEXT: cmpld 3, 4
; CHECK-NEXT: li 3, 0
; CHECK-NEXT: beqlr 0
; CHECK-NEXT: .LBB1_2: # %res_block
; CHECK-NEXT: li 3, 1
; CHECK-NEXT: blr
  %call = tail call signext i32 @memcmp(i8* %x, i8* %y, i64 16)
  %not.tobool = icmp ne i32 %call, 0
  %. = zext i1 %not.tobool to i32
  ret i32 %.
}

; Check 7 bytes - requires 3 loads for each param.
; Only inequality with zero is tested, so the function returns 1 when the two
; 7-byte regions differ and 0 when they match.
; Expected code splits the 7 bytes into a 4-byte load at offset 0 (lwz), a
; 2-byte load at offset 4 (lhz) and a 1-byte load at offset 6 (lbz). Any
; mismatch branches to res_block, which returns 1; if the last pair is equal
; the preloaded 0 is returned via beqlr.
define signext i32 @zeroEqualityTest03(i8* %x, i8* %y) {
; CHECK-LABEL: zeroEqualityTest03:
; CHECK: # BB#0: # %loadbb
; CHECK-NEXT: lwz 5, 0(3)
; CHECK-NEXT: lwz 6, 0(4)
; CHECK-NEXT: cmplw 5, 6
; CHECK-NEXT: bne 0, .LBB2_3
; CHECK-NEXT: # BB#1: # %loadbb1
; CHECK-NEXT: lhz 5, 4(3)
; CHECK-NEXT: lhz 6, 4(4)
; CHECK-NEXT: cmplw 5, 6
; CHECK-NEXT: bne 0, .LBB2_3
; CHECK-NEXT: # BB#2: # %loadbb2
; CHECK-NEXT: lbz 3, 6(3)
; CHECK-NEXT: lbz 4, 6(4)
; CHECK-NEXT: cmplw 3, 4
; CHECK-NEXT: li 3, 0
; CHECK-NEXT: beqlr 0
; CHECK-NEXT: .LBB2_3: # %res_block
; CHECK-NEXT: li 3, 1
; CHECK-NEXT: blr
  %call = tail call signext i32 @memcmp(i8* %x, i8* %y, i64 7)
  %not.lnot = icmp ne i32 %call, 0
  %cond = zext i1 %not.lnot to i32
  ret i32 %cond
}

; Validate with > 0
; The IR returns 1 when the memcmp result is less than 1 (icmp slt ..., 1),
; i.e. it returns 0 only for a positive result. The operands are the first 16
; bytes of the zeroEqualityTest02 buffers.
; Because the sign of the result matters, the expected code is a three-way
; expansion: ldbrx loads 8 bytes at a time from each buffer, res_block uses
; cmpld/isel to pick -1 or 1, and endblock derives the final 0/1 from that
; value with neg/rldicl/xori.
; NOTE(review): the byte-reversed loads are presumably needed because the
; target is little-endian and an ordered compare is required - confirm.
define signext i32 @zeroEqualityTest04() {
; CHECK-LABEL: zeroEqualityTest04:
; CHECK: # BB#0: # %loadbb
; CHECK-NEXT: addis 3, 2, .LzeroEqualityTest02.buffer1@toc@ha
; CHECK-NEXT: addis 4, 2, .LzeroEqualityTest02.buffer2@toc@ha
; CHECK-NEXT: addi 6, 3, .LzeroEqualityTest02.buffer1@toc@l
; CHECK-NEXT: addi 5, 4, .LzeroEqualityTest02.buffer2@toc@l
; CHECK-NEXT: ldbrx 3, 0, 6
; CHECK-NEXT: ldbrx 4, 0, 5
; CHECK-NEXT: cmpld 3, 4
; CHECK-NEXT: bne 0, .LBB3_2
; CHECK-NEXT: # BB#1: # %loadbb1
; CHECK-NEXT: li 4, 8
; CHECK-NEXT: ldbrx 3, 6, 4
; CHECK-NEXT: ldbrx 4, 5, 4
; CHECK-NEXT: li 5, 0
; CHECK-NEXT: cmpld 3, 4
; CHECK-NEXT: beq 0, .LBB3_3
; CHECK-NEXT: .LBB3_2: # %res_block
; CHECK-NEXT: cmpld 3, 4
; CHECK-NEXT: li 11, 1
; CHECK-NEXT: li 12, -1
; CHECK-NEXT: isel 5, 12, 11, 0
; CHECK-NEXT: .LBB3_3: # %endblock
; CHECK-NEXT: neg 3, 5
; CHECK-NEXT: rldicl 3, 3, 1, 63
; CHECK-NEXT: xori 3, 3, 1
; CHECK-NEXT: blr
  %call = tail call signext i32 @memcmp(i8* bitcast ([4 x i32]* @zeroEqualityTest02.buffer1 to i8*), i8* bitcast ([4 x i32]* @zeroEqualityTest02.buffer2 to i8*), i64 16)
  %not.cmp = icmp slt i32 %call, 1
  %. = zext i1 %not.cmp to i32
  ret i32 %.
}

; Validate with < 0
; The IR shifts the sign bit of the memcmp result down (lshr 31) and inverts
; it (xor 1), so the function returns 1 when the result is non-negative and 0
; when it is negative. The operands are the first 16 bytes of the
; zeroEqualityTest03 buffers.
; Expected code is the same three-way expansion as zeroEqualityTest04 (ldbrx
; loads, cmpld/isel selecting -1 or 1 in res_block); endblock then extracts
; and inverts the sign bit with srwi/xori and clears the upper 32 bits with
; clrldi.
define signext i32 @zeroEqualityTest05() {
; CHECK-LABEL: zeroEqualityTest05:
; CHECK: # BB#0: # %loadbb
; CHECK-NEXT: addis 3, 2, .LzeroEqualityTest03.buffer1@toc@ha
; CHECK-NEXT: addis 4, 2, .LzeroEqualityTest03.buffer2@toc@ha
; CHECK-NEXT: addi 6, 3, .LzeroEqualityTest03.buffer1@toc@l
; CHECK-NEXT: addi 5, 4, .LzeroEqualityTest03.buffer2@toc@l
; CHECK-NEXT: ldbrx 3, 0, 6
; CHECK-NEXT: ldbrx 4, 0, 5
; CHECK-NEXT: cmpld 3, 4
; CHECK-NEXT: bne 0, .LBB4_2
; CHECK-NEXT: # BB#1: # %loadbb1
; CHECK-NEXT: li 4, 8
; CHECK-NEXT: ldbrx 3, 6, 4
; CHECK-NEXT: ldbrx 4, 5, 4
; CHECK-NEXT: li 5, 0
; CHECK-NEXT: cmpld 3, 4
; CHECK-NEXT: beq 0, .LBB4_3
; CHECK-NEXT: .LBB4_2: # %res_block
; CHECK-NEXT: cmpld 3, 4
; CHECK-NEXT: li 11, 1
; CHECK-NEXT: li 12, -1
; CHECK-NEXT: isel 5, 12, 11, 0
; CHECK-NEXT: .LBB4_3: # %endblock
; CHECK-NEXT: srwi 3, 5, 31
; CHECK-NEXT: xori 3, 3, 1
; CHECK-NEXT: clrldi 3, 3, 32
; CHECK-NEXT: blr
  %call = tail call signext i32 @memcmp(i8* bitcast ([4 x i32]* @zeroEqualityTest03.buffer1 to i8*), i8* bitcast ([4 x i32]* @zeroEqualityTest03.buffer2 to i8*), i64 16)
  %call.lobit = lshr i32 %call, 31
  %call.lobit.not = xor i32 %call.lobit, 1
  ret i32 %call.lobit.not
}

; Validate with memcmp()?:
; Both operands are constant buffers whose first 16 bytes are identical
; (i32 0, 1, 2, 3 in each), and the result is only tested for equality with
; zero. Expected code is fully folded: it returns the constant 1 with no loads
; and no call.
define signext i32 @equalityFoldTwoConstants() {
; CHECK-LABEL: equalityFoldTwoConstants:
; CHECK: # BB#0: # %endblock
; CHECK-NEXT: li 3, 1
; CHECK-NEXT: blr
  %call = tail call signext i32 @memcmp(i8* bitcast ([15 x i32]* @zeroEqualityTest04.buffer1 to i8*), i8* bitcast ([15 x i32]* @zeroEqualityTest04.buffer2 to i8*), i64 16)
  %not.tobool = icmp eq i32 %call, 0
  %cond = zext i1 %not.tobool to i32
  ret i32 %cond
}

; Equality-only memcmp of 16 bytes where one operand is a constant buffer and
; the other is the pointer argument %X. Returns 1 when the regions match.
; Expected code never loads the constant buffer: each doubleword loaded from
; %X is compared against an immediate built with li/sldi/ori. The immediates
; are 1 << 32 and (3 << 32) | 2, i.e. the i32 pairs (0, 1) and (2, 3) from
; zeroEqualityTest04.buffer1 read as little-endian doublewords. endblock turns
; the 0 (match) or 1 (mismatch) left in r3 into the result with cntlzw/srwi.
define signext i32 @equalityFoldOneConstant(i8* %X) {
; CHECK-LABEL: equalityFoldOneConstant:
; CHECK: # BB#0: # %loadbb
; CHECK-NEXT: li 4, 1
; CHECK-NEXT: ld 5, 0(3)
; CHECK-NEXT: sldi 4, 4, 32
; CHECK-NEXT: cmpld 5, 4
; CHECK-NEXT: bne 0, .LBB6_2
; CHECK-NEXT: # BB#1: # %loadbb1
; CHECK-NEXT: li 4, 3
; CHECK-NEXT: ld 3, 8(3)
; CHECK-NEXT: sldi 4, 4, 32
; CHECK-NEXT: ori 4, 4, 2
; CHECK-NEXT: cmpld 3, 4
; CHECK-NEXT: li 3, 0
; CHECK-NEXT: beq 0, .LBB6_3
; CHECK-NEXT: .LBB6_2: # %res_block
; CHECK-NEXT: li 3, 1
; CHECK-NEXT: .LBB6_3: # %endblock
; CHECK-NEXT: cntlzw 3, 3
; CHECK-NEXT: srwi 3, 3, 5
; CHECK-NEXT: blr
  %call = tail call signext i32 @memcmp(i8* bitcast ([15 x i32]* @zeroEqualityTest04.buffer1 to i8*), i8* %X, i64 16)
  %not.tobool = icmp eq i32 %call, 0
  %cond = zext i1 %not.tobool to i32
  ret i32 %cond
}

; Equality-only memcmp of 2 bytes where the call site carries the nobuiltin
; attribute. Returns true (i1) when the memcmp result is zero.
; Expected code keeps a real library call: it sets up a 32-byte stack frame,
; saves the link register, passes the length 2 in r5 and emits "bl memcmp".
; The returned value is then tested for zero with cntlzw/rlwinm.
define i1 @length2_eq_nobuiltin_attr(i8* %X, i8* %Y) {
; CHECK-LABEL: length2_eq_nobuiltin_attr:
; CHECK: # BB#0:
; CHECK-NEXT: mflr 0
; CHECK-NEXT: std 0, 16(1)
; CHECK-NEXT: stdu 1, -32(1)
; CHECK-NEXT: .cfi_def_cfa_offset 32
; CHECK-NEXT: .cfi_offset lr, 16
; CHECK-NEXT: li 5, 2
; CHECK-NEXT: bl memcmp
; CHECK-NEXT: nop
; CHECK-NEXT: cntlzw 3, 3
; CHECK-NEXT: rlwinm 3, 3, 27, 31, 31
; CHECK-NEXT: addi 1, 1, 32
; CHECK-NEXT: ld 0, 16(1)
; CHECK-NEXT: mtlr 0
; CHECK-NEXT: blr
  %m = tail call signext i32 @memcmp(i8* %X, i8* %Y, i64 2) nobuiltin
  %c = icmp eq i32 %m, 0
  ret i1 %c
}
