blob: 81a8f496c25414c0f939ac1791c760906a7b6f32 [file] [log] [blame]
Tobias Grossercdb38e52015-05-29 17:08:19 +00001; RUN: opt %loadPolly -polly-import-jscop -polly-import-jscop-dir=%S -polly-codegen -S < %s | FileCheck %s
Tobias Grossercb73f152015-06-03 06:31:30 +00002; RUN: opt %loadPolly -polly-import-jscop -polly-import-jscop-dir=%S -polly-codegen -polly-import-jscop-postfix=pow2 -S < %s | FileCheck %s -check-prefix=POW2
Tobias Grossercdb38e52015-05-29 17:08:19 +00003;
4; void exprModDiv(float *A, float *B, float *C, long N, long p) {
5; for (long i = 0; i < N; i++)
6; C[i] += A[i] + B[i] + A[p] + B[p];
7; }
8;
9;
10; This test case changes the access functions such that the resulting index
11; expressions are modulo or division operations. We test that the code we
12; generate takes advantage of knowledge about unsigned numerators. This is
13; useful as LLVM will translate urem and udiv operations with power-of-two
14; denominators to fast bitwise and or shift operations.
15
Tobias Grossercb73f152015-06-03 06:31:30 +000016; A[i % 127]
17; CHECK: %pexp.pdiv_r = urem i64 %polly.indvar, 127
Tobias Grossercdb38e52015-05-29 17:08:19 +000018; CHECK: %polly.access.A6 = getelementptr float, float* %A, i64 %pexp.pdiv_r
19
Tobias Grossercb73f152015-06-03 06:31:30 +000020; A[i / 127]
21; CHECK: %pexp.div = sdiv i64 %polly.indvar, 127
Tobias Grossercdb38e52015-05-29 17:08:19 +000022; CHECK: %polly.access.B8 = getelementptr float, float* %B, i64 %pexp.div
23;
24; FIXME: Make isl mark this as an udiv expression.
25
26; #define floord(n,d) ((n < 0) ? (n - d + 1) : n) / d
Tobias Grossercb73f152015-06-03 06:31:30 +000027; A[p + 127 * floord(-p - 1, 127) + 127]
Tobias Grossercdb38e52015-05-29 17:08:19 +000028; CHECK: %20 = sub nsw i64 0, %p
29; CHECK: %21 = sub nsw i64 %20, 1
Tobias Grossercb73f152015-06-03 06:31:30 +000030; CHECK: %pexp.fdiv_q.0 = sub i64 %21, 127
Tobias Grossercdb38e52015-05-29 17:08:19 +000031; CHECK: %pexp.fdiv_q.1 = add i64 %pexp.fdiv_q.0, 1
32; CHECK: %pexp.fdiv_q.2 = icmp slt i64 %21, 0
33; CHECK: %pexp.fdiv_q.3 = select i1 %pexp.fdiv_q.2, i64 %pexp.fdiv_q.1, i64 %21
Tobias Grossercb73f152015-06-03 06:31:30 +000034; CHECK: %pexp.fdiv_q.4 = sdiv i64 %pexp.fdiv_q.3, 127
35; CHECK: %22 = mul nsw i64 127, %pexp.fdiv_q.4
Tobias Grossercdb38e52015-05-29 17:08:19 +000036; CHECK: %23 = add nsw i64 %p, %22
Tobias Grossercb73f152015-06-03 06:31:30 +000037; CHECK: %24 = add nsw i64 %23, 127
Tobias Grossercdb38e52015-05-29 17:08:19 +000038; CHECK: %polly.access.A10 = getelementptr float, float* %A, i64 %24
39
Tobias Grossercb73f152015-06-03 06:31:30 +000040; A[p / 127]
41; CHECK: %pexp.div12 = sdiv i64 %p, 127
Tobias Grossercdb38e52015-05-29 17:08:19 +000042; CHECK: %polly.access.B13 = getelementptr float, float* %B, i64 %pexp.div12
43
Tobias Grossercb73f152015-06-03 06:31:30 +000044; A[i % 128]
45; POW2: %pexp.pdiv_r = urem i64 %polly.indvar, 128
46; POW2: %polly.access.A6 = getelementptr float, float* %A, i64 %pexp.pdiv_r
47
48; A[i / 128]
Tobias Grosser244c8292015-06-03 15:14:58 +000049; POW2: %pexp.div.shr = ashr i64 %polly.indvar, 7
Tobias Grossercb73f152015-06-03 06:31:30 +000050; POW2: %polly.access.B8 = getelementptr float, float* %B, i64 %pexp.div
Tobias Grossercb73f152015-06-03 06:31:30 +000051
52; #define floord(n,d) ((n < 0) ? (n - d + 1) : n) / d
53; A[p + 128 * floord(-p - 1, 128) + 128]
54; POW2: %20 = sub nsw i64 0, %p
55; POW2: %21 = sub nsw i64 %20, 1
56; POW2: %polly.fdiv_q.shr = ashr i64 %21, 7
57; POW2: %22 = mul nsw i64 128, %polly.fdiv_q.shr
58; POW2: %23 = add nsw i64 %p, %22
59; POW2: %24 = add nsw i64 %23, 128
60; POW2: %polly.access.A10 = getelementptr float, float* %A, i64 %24
61
62; A[p / 128]
Tobias Grosser244c8292015-06-03 15:14:58 +000063; POW2: %pexp.div.shr12 = ashr i64 %p, 7
64; POW2: %polly.access.B13 = getelementptr float, float* %B, i64 %pexp.div.shr12
Tobias Grossercb73f152015-06-03 06:31:30 +000065
Tobias Grossercdb38e52015-05-29 17:08:19 +000066target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
67
68define void @exprModDiv(float* %A, float* %B, float* %C, i64 %N, i64 %p) {
69entry:
70 br label %for.cond
71
72for.cond: ; preds = %for.inc, %entry
73 %i.0 = phi i64 [ 0, %entry ], [ %inc, %for.inc ]
74 %cmp = icmp slt i64 %i.0, %N
75 br i1 %cmp, label %for.body, label %for.end
76
77for.body: ; preds = %for.cond
78 %arrayidx = getelementptr inbounds float, float* %A, i64 %i.0
79 %tmp = load float, float* %arrayidx, align 4
80 %arrayidx1 = getelementptr inbounds float, float* %B, i64 %i.0
81 %tmp1 = load float, float* %arrayidx1, align 4
82 %add = fadd float %tmp, %tmp1
83 %arrayidx2 = getelementptr inbounds float, float* %A, i64 %p
84 %tmp2 = load float, float* %arrayidx2, align 4
85 %add3 = fadd float %add, %tmp2
86 %arrayidx4 = getelementptr inbounds float, float* %B, i64 %p
87 %tmp3 = load float, float* %arrayidx4, align 4
88 %add5 = fadd float %add3, %tmp3
89 %arrayidx6 = getelementptr inbounds float, float* %C, i64 %i.0
90 %tmp4 = load float, float* %arrayidx6, align 4
91 %add7 = fadd float %tmp4, %add5
92 store float %add7, float* %arrayidx6, align 4
93 br label %for.inc
94
95for.inc: ; preds = %for.body
96 %inc = add nuw nsw i64 %i.0, 1
97 br label %for.cond
98
99for.end: ; preds = %for.cond
100 ret void
101}