Two more test cases: or_ops.ll (arithmetic or operations) and vecinsert.ll
(vector insertions)


git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@45216 91177308-0d34-0410-b5e6-96231b3b80d8
diff --git a/test/CodeGen/CellSPU/vecinsert.ll b/test/CodeGen/CellSPU/vecinsert.ll
new file mode 100644
index 0000000..104a205
--- /dev/null
+++ b/test/CodeGen/CellSPU/vecinsert.ll
@@ -0,0 +1,53 @@
+; RUN: llvm-as -o - %s | llc -march=cellspu > %t1.s
+; RUN: grep cbd     %t1.s | count 3 &&
+; RUN: grep chd     %t1.s | count 3 &&
+; RUN: grep cwd     %t1.s | count 6 &&
+; RUN: grep il      %t1.s | count 4 &&
+; RUN: grep ilh     %t1.s | count 3 &&
+; RUN: grep iohl    %t1.s | count 1 &&
+; RUN: grep ilhu    %t1.s | count 1 &&
+; RUN: grep shufb   %t1.s | count 12 &&
+; RUN: grep 17219   %t1.s | count 1 &&
+; RUN: grep 22598   %t1.s | count 1 &&
+; RUN: grep -- -39  %t1.s | count 1 &&
+; RUN: grep    24   %t1.s | count 1 &&
+; RUN: grep  1159   %t1.s | count 1
+; ModuleID = 'vecinsert.bc'
+target datalayout = "E-p:32:32:128-f64:64:128-f32:32:128-i64:32:128-i32:32:128-i16:16:128-i8:8:128-i1:8:128-a0:0:128-v128:128:128"
+target triple = "spu-unknown-elf"
+
+; 67 -> 0x43, as 8-bit vector constant load = 0x4343 (17219)0x4343
+define <16 x i8> @test_v16i8(<16 x i8> %P, i8 %x) {
+entry:
+ 	%tmp1 = insertelement <16 x i8> %P, i8 %x, i32 10
+ 	%tmp1.1 = insertelement <16 x i8> %tmp1, i8 67, i32 7
+ 	%tmp1.2 = insertelement <16 x i8> %tmp1.1, i8 %x, i32 15
+	ret <16 x i8> %tmp1.2
+}
+
+; 22598 -> 0x5846
+define <8 x i16> @test_v8i16(<8 x i16> %P, i16 %x) {
+entry:
+ 	%tmp1 = insertelement <8 x i16> %P, i16 %x, i32 5
+ 	%tmp1.1 = insertelement <8 x i16> %tmp1, i16 22598, i32 7
+ 	%tmp1.2 = insertelement <8 x i16> %tmp1.1, i16 %x, i32 2
+	ret <8 x i16> %tmp1.2
+}
+
+; 1574023 -> 0x180487 (ILHU 24/IOHL 1159)
+define <4 x i32> @test_v4i32_1(<4 x i32> %P, i32 %x) {
+entry:
+ 	%tmp1 = insertelement <4 x i32> %P, i32 %x, i32 2
+ 	%tmp1.1 = insertelement <4 x i32> %tmp1, i32 1574023, i32 1
+ 	%tmp1.2 = insertelement <4 x i32> %tmp1.1, i32 %x, i32 3
+	ret <4 x i32> %tmp1.2
+}
+
+; Should generate IL for the load
+define <4 x i32> @test_v4i32_2(<4 x i32> %P, i32 %x) {
+entry:
+ 	%tmp1 = insertelement <4 x i32> %P, i32 %x, i32 2
+ 	%tmp1.1 = insertelement <4 x i32> %tmp1, i32 -39, i32 1
+ 	%tmp1.2 = insertelement <4 x i32> %tmp1.1, i32 %x, i32 3
+	ret <4 x i32> %tmp1.2
+}