Exploit non-negative numerators isl marks known non-negative numerators in modulo (and soon also division) operations. We now exploit this by generating unsigned operations. This is beneficial as unsigned operations with power-of-two denominators will be translated by isl to fast bitshift or bitwise and operations. llvm-svn: 238577

commit: cdb38e5625b760aa6634084a45ec563e8ff797e4 [log] [tgz]
author: Tobias Grosser <tobias@grosser.es> Fri May 29 17:08:19 2015 +0000
committer: Tobias Grosser <tobias@grosser.es> Fri May 29 17:08:19 2015 +0000
tree: 4063166e77b941e9e0acbd951f041ad947774b03
parent: 09b832cac54cfa6693523d4a3116ce74640e65ae [diff] [blame]
diff --git a/polly/test/Isl/CodeGen/exprModDiv.ll b/polly/test/Isl/CodeGen/exprModDiv.ll
new file mode 100644
index 0000000..e471e6b
--- /dev/null
+++ b/polly/test/Isl/CodeGen/exprModDiv.ll

@@ -0,0 +1,78 @@
+; RUN: opt %loadPolly -polly-import-jscop -polly-import-jscop-dir=%S -polly-codegen -S < %s | FileCheck %s
+;
+;    void exprModDiv(float *A, float *B, float *C, long N, long p) {
+;      for (long i = 0; i < N; i++)
+;        C[i] += A[i] + B[i] + A[p] + B[p];
+;    }
+;
+;
+; This test case changes the access functions such that the resulting index
+; expressions are modulo or division operations. We test that the code we
+; generate takes advantage of knowledge about unsigned numerators. This is
+; useful as LLVM will translate urem and udiv operations with power-of-two
+; denominators to fast bitwise and or shift operations.
+
+; A[i % 128]
+; CHECK:  %pexp.pdiv_r = urem i64 %polly.indvar, 128
+; CHECK:  %polly.access.A6 = getelementptr float, float* %A, i64 %pexp.pdiv_r
+
+; A[i / 128]
+; CHECK:  %pexp.div = sdiv i64 %polly.indvar, 128
+; CHECK:  %polly.access.B8 = getelementptr float, float* %B, i64 %pexp.div
+;
+; FIXME: Make isl mark this as an udiv expression.
+
+; #define floord(n,d) ((n < 0) ? (n - d + 1) : n) / d
+; A[p + 128 * floord(-p - 1, 128) + 128]
+; CHECK:  %20 = sub nsw i64 0, %p
+; CHECK:  %21 = sub nsw i64 %20, 1
+; CHECK:  %pexp.fdiv_q.0 = sub i64 %21, 128
+; CHECK:  %pexp.fdiv_q.1 = add i64 %pexp.fdiv_q.0, 1
+; CHECK:  %pexp.fdiv_q.2 = icmp slt i64 %21, 0
+; CHECK:  %pexp.fdiv_q.3 = select i1 %pexp.fdiv_q.2, i64 %pexp.fdiv_q.1, i64 %21
+; CHECK:  %pexp.fdiv_q.4 = sdiv i64 %pexp.fdiv_q.3, 128
+; CHECK:  %22 = mul nsw i64 128, %pexp.fdiv_q.4
+; CHECK:  %23 = add nsw i64 %p, %22
+; CHECK:  %24 = add nsw i64 %23, 128
+; CHECK:  %polly.access.A10 = getelementptr float, float* %A, i64 %24
+
+; A[p / 128]
+; CHECK:  %pexp.div12 = sdiv i64 %p, 128
+; CHECK:  %polly.access.B13 = getelementptr float, float* %B, i64 %pexp.div12
+
+target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
+
+define void @exprModDiv(float* %A, float* %B, float* %C, i64 %N, i64 %p) {
+entry:
+  br label %for.cond
+
+for.cond:                                         ; preds = %for.inc, %entry
+  %i.0 = phi i64 [ 0, %entry ], [ %inc, %for.inc ]
+  %cmp = icmp slt i64 %i.0, %N
+  br i1 %cmp, label %for.body, label %for.end
+
+for.body:                                         ; preds = %for.cond
+  %arrayidx = getelementptr inbounds float, float* %A, i64 %i.0
+  %tmp = load float, float* %arrayidx, align 4
+  %arrayidx1 = getelementptr inbounds float, float* %B, i64 %i.0
+  %tmp1 = load float, float* %arrayidx1, align 4
+  %add = fadd float %tmp, %tmp1
+  %arrayidx2 = getelementptr inbounds float, float* %A, i64 %p
+  %tmp2 = load float, float* %arrayidx2, align 4
+  %add3 = fadd float %add, %tmp2
+  %arrayidx4 = getelementptr inbounds float, float* %B, i64 %p
+  %tmp3 = load float, float* %arrayidx4, align 4
+  %add5 = fadd float %add3, %tmp3
+  %arrayidx6 = getelementptr inbounds float, float* %C, i64 %i.0
+  %tmp4 = load float, float* %arrayidx6, align 4
+  %add7 = fadd float %tmp4, %add5
+  store float %add7, float* %arrayidx6, align 4
+  br label %for.inc
+
+for.inc:                                          ; preds = %for.body
+  %inc = add nuw nsw i64 %i.0, 1
+  br label %for.cond
+
+for.end:                                          ; preds = %for.cond
+  ret void
+}
commit	cdb38e5625b760aa6634084a45ec563e8ff797e4	[log] [tgz]
author	Tobias Grosser <tobias@grosser.es>	Fri May 29 17:08:19 2015 +0000
committer	Tobias Grosser <tobias@grosser.es>	Fri May 29 17:08:19 2015 +0000
tree	4063166e77b941e9e0acbd951f041ad947774b03
parent	09b832cac54cfa6693523d4a3116ce74640e65ae [diff] [blame]