blob: 48d2530e80c65bb561400d90cdc02c10ab73d957 [file] [log] [blame]
Simon Pilgrim33f73972017-05-06 20:53:52 +00001; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2; RUN: llc < %s -mtriple=x86_64-unknown -mattr=+sse2 | FileCheck %s --check-prefix=SSE --check-prefix=SSE2
3; RUN: llc < %s -mtriple=x86_64-unknown -mattr=+sse4.2 | FileCheck %s --check-prefix=SSE --check-prefix=SSE42
4; RUN: llc < %s -mtriple=x86_64-unknown -mattr=+avx2 | FileCheck %s --check-prefix=AVX --check-prefix=AVX2
5; RUN: llc < %s -mtriple=x86_64-unknown -mattr=+avx512f | FileCheck %s --check-prefix=AVX --check-prefix=AVX512
6
7define <2 x i64> @PR32907(<2 x i64> %astype.i, <2 x i64> %astype6.i) {
8; SSE-LABEL: PR32907:
9; SSE: # BB#0: # %entry
10; SSE-NEXT: psubq %xmm1, %xmm0
11; SSE-NEXT: movdqa %xmm0, %xmm1
12; SSE-NEXT: psrad $31, %xmm1
13; SSE-NEXT: pshufd {{.*#+}} xmm2 = xmm1[1,1,3,3]
14; SSE-NEXT: pxor %xmm1, %xmm1
15; SSE-NEXT: psubq %xmm0, %xmm1
16; SSE-NEXT: pand %xmm2, %xmm1
17; SSE-NEXT: pandn %xmm0, %xmm2
18; SSE-NEXT: por %xmm2, %xmm1
19; SSE-NEXT: movdqa %xmm1, %xmm0
20; SSE-NEXT: retq
21;
22; AVX2-LABEL: PR32907:
23; AVX2: # BB#0: # %entry
24; AVX2-NEXT: vpsubq %xmm1, %xmm0, %xmm0
25; AVX2-NEXT: vpsrad $31, %xmm0, %xmm1
26; AVX2-NEXT: vpshufd {{.*#+}} xmm1 = xmm1[1,1,3,3]
27; AVX2-NEXT: vpxor %xmm2, %xmm2, %xmm2
28; AVX2-NEXT: vpsubq %xmm0, %xmm2, %xmm2
29; AVX2-NEXT: vpandn %xmm0, %xmm1, %xmm0
30; AVX2-NEXT: vpand %xmm2, %xmm1, %xmm1
31; AVX2-NEXT: vpor %xmm1, %xmm0, %xmm0
32; AVX2-NEXT: retq
33;
34; AVX512-LABEL: PR32907:
35; AVX512: # BB#0: # %entry
36; AVX512-NEXT: vpsubq %xmm1, %xmm0, %xmm0
37; AVX512-NEXT: vpsraq $63, %zmm0, %zmm1
Simon Pilgrimdf39b032017-05-08 14:16:39 +000038; AVX512-NEXT: vpxor %xmm1, %xmm0, %xmm0
39; AVX512-NEXT: vpsubq %xmm1, %xmm0, %xmm0
Simon Pilgrim33f73972017-05-06 20:53:52 +000040; AVX512-NEXT: vzeroupper
41; AVX512-NEXT: retq
42entry:
43 %sub13.i = sub <2 x i64> %astype.i, %astype6.i
44 %x.lobit.i.i = ashr <2 x i64> %sub13.i, <i64 63, i64 63>
45 %sub.i.i = sub <2 x i64> zeroinitializer, %sub13.i
46 %0 = xor <2 x i64> %x.lobit.i.i, <i64 -1, i64 -1>
47 %1 = and <2 x i64> %sub13.i, %0
48 %2 = and <2 x i64> %x.lobit.i.i, %sub.i.i
49 %cond.i.i = or <2 x i64> %1, %2
50 ret <2 x i64> %cond.i.i
51}