; RUN: llc -march=hexagon < %s | FileCheck %s

; This code generates a concat_vectors with more than 2 inputs. Make sure
; that this compiles successfully.
; CHECK: vlsr

target datalayout = "e-m:e-p:32:32:32-a:0-n16:32-i64:64:64-i32:32:32-i16:16:16-i1:8:8-f32:32:32-f64:64:64-v32:32:32-v64:64:64-v512:512:512-v1024:1024:1024-v2048:2048:2048"
target triple = "hexagon"

; @fred is a reduced reproducer: it loads two i32 values, pushes one of them
; through a chain of partially-undef vector operations, and uses lane 5 of the
; final <8 x i32> as a byte offset for a load whose result is stored to %a2.
; The instruction sequence is intentionally left exactly as reduced; do not
; simplify or reorder it, since the test depends on the DAG it produces.
define void @fred(i32* %a0, i32* %a1, i8* %a2) #0 {
b0:
  ; Scalar part: %v4 = 0 - (0 + (*%a0 * -15137)).
  %v1 = load i32, i32* %a0, align 4
  %v2 = mul nsw i32 %v1, -15137
  %v3 = add nsw i32 0, %v2
  %v4 = sub nsw i32 0, %v3
  ; Second scalar goes into lane 1 of a <2 x i32>. %v8 has no users within
  ; this function; it is kept as part of the reduced input.
  %v5 = load i32, i32* %a1, align 4
  %v6 = insertelement <2 x i32> undef, i32 %v5, i32 1
  %v7 = add nsw <2 x i32> %v6, %v6
  %v8 = extractelement <2 x i32> %v7, i32 0
  ; Build a <4 x i32> whose only defined lane (lane 2) holds %v4.
  %v9 = insertelement <4 x i32> undef, i32 %v4, i32 2
  %v10 = insertelement <4 x i32> %v9, i32 undef, i32 3
  %v11 = add <4 x i32> %v10, %v10
  %v12 = sub <4 x i32> %v11, zeroinitializer
  ; Widen to 8 lanes: lanes 0..3 of %v12 land in the odd lanes 1,3,5,7 and
  ; the even lanes are undef. The second shuffle keeps those odd lanes and
  ; takes the even lanes from an undef vector.
  ; NOTE(review): presumably these shuffles are what lower to the
  ; multi-input concat_vectors mentioned at the top of the file - confirm.
  %v13 = shufflevector <4 x i32> %v12, <4 x i32> undef, <8 x i32> <i32 undef, i32 0, i32 undef, i32 1, i32 undef, i32 2, i32 undef, i32 3>
  %v14 = shufflevector <8 x i32> undef, <8 x i32> %v13, <8 x i32> <i32 0, i32 9, i32 2, i32 11, i32 4, i32 13, i32 6, i32 15>
  ; Vector logical shift right by 18 in every lane, then AND with the
  ; unshifted value.
  %v15 = lshr <8 x i32> %v14, <i32 18, i32 18, i32 18, i32 18, i32 18, i32 18, i32 18, i32 18>
  %v16 = and <8 x i32> %v15, %v14
  ; Lane 5 traces back to lane 2 of %v12, i.e. the value derived from %v4.
  %v17 = extractelement <8 x i32> %v16, i32 5
  ; The extracted lane is used as an offset from a null base pointer; the
  ; loaded byte is written to %a2 so the computation has an observable use.
  %v18 = getelementptr inbounds i8, i8* null, i32 %v17
  %v19 = load i8, i8* %v18, align 1
  store i8 %v19, i8* %a2, align 1
  ret void
}

; Function attributes for @fred: nounwind, the hexagonv60 target CPU, and the
; hvx-length64b and hvxv60 target features.
attributes #0 = { nounwind "target-cpu"="hexagonv60" "target-features"="+hvx-length64b,+hvxv60" }