Hao Liu | a2ff698 | 2013-04-18 09:11:08 +0000 | [diff] [blame] | 1 | ; RUN: llc < %s -mtriple=thumbv7-none-linux-gnueabi -mcpu=cortex-a9 -mattr=+neon,+neonfp | FileCheck %s |
| 2 | ; PR14824. The test is presented by Jiangning Liu. If the ld/st optimization algorithm is changed, this test case may fail. |
| 3 | ; Also, if the machine code for the ld/st optimizer is changed, this test case may fail. If so, remove this test. |
| 4 | |
| 5 | define void @sample_test(<8 x i64> * %secondSource, <8 x i64> * %source, <8 x i64> * %dest) nounwind {
| 6 | ; CHECK: sample_test |
| 7 | ; CHECK-NOT: vldmia |
| 8 | ; CHECK: add |
| 9 | entry: |
| 10 | |
| 11 | ; Load the vectors at index 0 (%s0, not used afterwards) and index 6 of %source, then build %s130 from 64-bit slices of the index-6 vector viewed as an i512 |
David Blaikie | a79ac14 | 2015-02-27 21:17:42 +0000 | [diff] [blame] | 12 | %s0 = load <8 x i64> , <8 x i64> * %source, align 64 |
David Blaikie | 79e6c74 | 2015-02-27 19:29:02 +0000 | [diff] [blame] | 13 | %arrayidx64 = getelementptr inbounds <8 x i64>, <8 x i64> * %source, i32 6 |
David Blaikie | a79ac14 | 2015-02-27 21:17:42 +0000 | [diff] [blame] | 14 | %s120 = load <8 x i64> , <8 x i64> * %arrayidx64, align 64 |
Hao Liu | a2ff698 | 2013-04-18 09:11:08 +0000 | [diff] [blame] | 15 | %s122 = bitcast <8 x i64> %s120 to i512 |
| 16 | %data.i.i677.48.extract.shift = lshr i512 %s122, 384 |
| 17 | %data.i.i677.48.extract.trunc = trunc i512 %data.i.i677.48.extract.shift to i64 |
| 18 | %s123 = insertelement <8 x i64> undef, i64 %data.i.i677.48.extract.trunc, i32 0 |
| 19 | %data.i.i677.32.extract.shift = lshr i512 %s122, 256 |
| 20 | %data.i.i677.32.extract.trunc = trunc i512 %data.i.i677.32.extract.shift to i64 |
| 21 | %s124 = insertelement <8 x i64> %s123, i64 %data.i.i677.32.extract.trunc, i32 1 |
| 22 | %data.i.i677.16.extract.shift = lshr i512 %s122, 128 |
| 23 | %data.i.i677.16.extract.trunc = trunc i512 %data.i.i677.16.extract.shift to i64 |
| 24 | %s125 = insertelement <8 x i64> %s124, i64 %data.i.i677.16.extract.trunc, i32 2 |
| 25 | %data.i.i677.56.extract.shift = lshr i512 %s122, 448 |
| 26 | %data.i.i677.56.extract.trunc = trunc i512 %data.i.i677.56.extract.shift to i64 |
| 27 | %s126 = insertelement <8 x i64> %s125, i64 %data.i.i677.56.extract.trunc, i32 3 |
| 28 | %data.i.i677.24.extract.shift = lshr i512 %s122, 192 |
| 29 | %data.i.i677.24.extract.trunc = trunc i512 %data.i.i677.24.extract.shift to i64 |
| 30 | %s127 = insertelement <8 x i64> %s126, i64 %data.i.i677.24.extract.trunc, i32 4 |
| 31 | %s128 = insertelement <8 x i64> %s127, i64 %data.i.i677.32.extract.trunc, i32 5 |
| 32 | %s129 = insertelement <8 x i64> %s128, i64 %data.i.i677.16.extract.trunc, i32 6 |
| 33 | %s130 = insertelement <8 x i64> %s129, i64 %data.i.i677.56.extract.trunc, i32 7 |
| 34 | |
| 35 | ; Load the vectors at index 0 (%s1, not used afterwards) and index 6 of %secondSource, then build %s139 from the same 64-bit slice pattern as %s130 |
David Blaikie | a79ac14 | 2015-02-27 21:17:42 +0000 | [diff] [blame] | 36 | %s1 = load <8 x i64> , <8 x i64> * %secondSource, align 64 |
David Blaikie | 79e6c74 | 2015-02-27 19:29:02 +0000 | [diff] [blame] | 37 | %arrayidx67 = getelementptr inbounds <8 x i64>, <8 x i64> * %secondSource, i32 6 |
David Blaikie | a79ac14 | 2015-02-27 21:17:42 +0000 | [diff] [blame] | 38 | %s121 = load <8 x i64> , <8 x i64> * %arrayidx67, align 64 |
Hao Liu | a2ff698 | 2013-04-18 09:11:08 +0000 | [diff] [blame] | 39 | %s131 = bitcast <8 x i64> %s121 to i512 |
| 40 | %data.i1.i676.48.extract.shift = lshr i512 %s131, 384 |
| 41 | %data.i1.i676.48.extract.trunc = trunc i512 %data.i1.i676.48.extract.shift to i64 |
| 42 | %s132 = insertelement <8 x i64> undef, i64 %data.i1.i676.48.extract.trunc, i32 0 |
| 43 | %data.i1.i676.32.extract.shift = lshr i512 %s131, 256 |
| 44 | %data.i1.i676.32.extract.trunc = trunc i512 %data.i1.i676.32.extract.shift to i64 |
| 45 | %s133 = insertelement <8 x i64> %s132, i64 %data.i1.i676.32.extract.trunc, i32 1 |
| 46 | %data.i1.i676.16.extract.shift = lshr i512 %s131, 128 |
| 47 | %data.i1.i676.16.extract.trunc = trunc i512 %data.i1.i676.16.extract.shift to i64 |
| 48 | %s134 = insertelement <8 x i64> %s133, i64 %data.i1.i676.16.extract.trunc, i32 2 |
| 49 | %data.i1.i676.56.extract.shift = lshr i512 %s131, 448 |
| 50 | %data.i1.i676.56.extract.trunc = trunc i512 %data.i1.i676.56.extract.shift to i64 |
| 51 | %s135 = insertelement <8 x i64> %s134, i64 %data.i1.i676.56.extract.trunc, i32 3 |
| 52 | %data.i1.i676.24.extract.shift = lshr i512 %s131, 192 |
| 53 | %data.i1.i676.24.extract.trunc = trunc i512 %data.i1.i676.24.extract.shift to i64 |
| 54 | %s136 = insertelement <8 x i64> %s135, i64 %data.i1.i676.24.extract.trunc, i32 4 |
| 55 | %s137 = insertelement <8 x i64> %s136, i64 %data.i1.i676.32.extract.trunc, i32 5 |
| 56 | %s138 = insertelement <8 x i64> %s137, i64 %data.i1.i676.16.extract.trunc, i32 6 |
| 57 | %s139 = insertelement <8 x i64> %s138, i64 %data.i1.i676.56.extract.trunc, i32 7 |
| 58 | |
| 59 | ; Shuffle %s139 and %s130 together and store the result at index 6 of %dest; then fill lanes 0-3 of a vector from slices of index 7 of %secondSource and store it at index 7 of %dest |
| 60 | %vecinit28.i.i699 = shufflevector <8 x i64> %s139, <8 x i64> %s130, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 12, i32 undef, i32 undef, i32 undef> |
| 61 | %vecinit35.i.i700 = shufflevector <8 x i64> %vecinit28.i.i699, <8 x i64> %s139, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 13, i32 undef, i32 undef> |
| 62 | %vecinit42.i.i701 = shufflevector <8 x i64> %vecinit35.i.i700, <8 x i64> %s139, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 14, i32 undef> |
| 63 | %vecinit49.i.i702 = shufflevector <8 x i64> %vecinit42.i.i701, <8 x i64> %s130, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 15> |
David Blaikie | 79e6c74 | 2015-02-27 19:29:02 +0000 | [diff] [blame] | 64 | %arrayidx72 = getelementptr inbounds <8 x i64>, <8 x i64> * %dest, i32 6 |
Hao Liu | a2ff698 | 2013-04-18 09:11:08 +0000 | [diff] [blame] | 65 | store <8 x i64> %vecinit49.i.i702, <8 x i64> * %arrayidx72, align 64 |
David Blaikie | 79e6c74 | 2015-02-27 19:29:02 +0000 | [diff] [blame] | 66 | %arrayidx78 = getelementptr inbounds <8 x i64>, <8 x i64> * %secondSource, i32 7 |
David Blaikie | a79ac14 | 2015-02-27 21:17:42 +0000 | [diff] [blame] | 67 | %s141 = load <8 x i64> , <8 x i64> * %arrayidx78, align 64 |
Hao Liu | a2ff698 | 2013-04-18 09:11:08 +0000 | [diff] [blame] | 68 | %s151 = bitcast <8 x i64> %s141 to i512 |
| 69 | %data.i1.i649.32.extract.shift = lshr i512 %s151, 256 |
| 70 | %data.i1.i649.32.extract.trunc = trunc i512 %data.i1.i649.32.extract.shift to i64 |
| 71 | %s152 = insertelement <8 x i64> undef, i64 %data.i1.i649.32.extract.trunc, i32 0 |
| 72 | %s153 = insertelement <8 x i64> %s152, i64 %data.i1.i649.32.extract.trunc, i32 1 |
| 73 | %data.i1.i649.16.extract.shift = lshr i512 %s151, 128 |
| 74 | %data.i1.i649.16.extract.trunc = trunc i512 %data.i1.i649.16.extract.shift to i64 |
| 75 | %s154 = insertelement <8 x i64> %s153, i64 %data.i1.i649.16.extract.trunc, i32 2 |
| 76 | %data.i1.i649.8.extract.shift = lshr i512 %s151, 64 |
| 77 | %data.i1.i649.8.extract.trunc = trunc i512 %data.i1.i649.8.extract.shift to i64 |
| 78 | %s155 = insertelement <8 x i64> %s154, i64 %data.i1.i649.8.extract.trunc, i32 3 |
David Blaikie | 79e6c74 | 2015-02-27 19:29:02 +0000 | [diff] [blame] | 79 | %arrayidx83 = getelementptr inbounds <8 x i64>, <8 x i64> * %dest, i32 7 |
Hao Liu | a2ff698 | 2013-04-18 09:11:08 +0000 | [diff] [blame] | 80 | store <8 x i64> %s155, <8 x i64> * %arrayidx83, align 64 |
| 81 | ret void |
| 82 | } |