Krzysztof Parzyszek | 47ab1f2 | 2015-03-18 16:23:44 +0000 | [diff] [blame] | 1 | ; RUN: llc -march=hexagon -verify-machineinstrs=true < %s | FileCheck %s |
| 2 | ; Testing for these 5 variants of circular store: |
| 3 | ; Q6_circ_store_update_B(inputLR, pDelay, -1, nConvLength, 4); |
| 4 | ; Q6_circ_store_update_D(inputLR, pDelay, -1, nConvLength, 4); |
| 5 | ; Q6_circ_store_update_HL(inputLR, pDelay, -1, nConvLength, 4); |
| 6 | ; Q6_circ_store_update_HH(inputLR, pDelay, -1, nConvLength, 4); |
| 7 | ; Q6_circ_store_update_W(inputLR, pDelay, -1, nConvLength, 4); |
| 8 | ; producing these |
| 9 | ; memb(r1++#-1:circ(m0)) = r3 |
| 10 | ; memd(r1++#-8:circ(m0)) = r1:0 |
| 11 | ; memh(r1++#-2:circ(m0)) = r3 |
| 12 | ; memh(r1++#-2:circ(m0)) = r3.h |
| 13 | ; memw(r1++#-4:circ(m0)) = r0 |
| 14 | |
| 15 | ; ModuleID = 'circ_st.i' |
| 16 | target datalayout = "e-p:32:32:32-i64:64:64-i32:32:32-i16:16:16-i1:32:32-f64:64:64-f32:32:32-v64:64:64-v32:32:32-a0:0-n16:32" |
| 17 | target triple = "hexagon" |
| 18 | |
| 19 | define zeroext i8 @foo1(i16 zeroext %filtMemLen, i16* %filtMemLR, i16 signext %filtMemIndex) nounwind { |
| 20 | entry: |
| 21 | %conv = zext i16 %filtMemLen to i32 |
| 22 | %shr2 = lshr i32 %conv, 1 |
| 23 | %idxprom = sext i16 %filtMemIndex to i32 |
| 24 | %arrayidx = getelementptr inbounds i16, i16* %filtMemLR, i32 %idxprom |
| 25 | %0 = bitcast i16* %arrayidx to i8* |
| 26 | %or = or i32 %shr2, 33554432 |
| 27 | ; CHECK: memb(r{{[0-9]*}}{{.}}++{{.}}#-1:circ(m{{[0-1]}})) |
| 28 | %1 = tail call i8* @llvm.hexagon.circ.stb(i8* %0, i32 0, i32 %or, i32 -1) |
| 29 | %2 = load i8, i8* %1, align 1, !tbaa !0 |
| 30 | ret i8 %2 |
| 31 | } |
| 32 | |
| 33 | declare i8* @llvm.hexagon.circ.stb(i8*, i32, i32, i32) nounwind |
| 34 | |
| 35 | define i64 @foo2(i16 zeroext %filtMemLen, i16* %filtMemLR, i16 signext %filtMemIndex) nounwind { |
| 36 | entry: |
| 37 | %conv = zext i16 %filtMemLen to i32 |
| 38 | %shr1 = lshr i32 %conv, 1 |
| 39 | %idxprom = sext i16 %filtMemIndex to i32 |
| 40 | %arrayidx = getelementptr inbounds i16, i16* %filtMemLR, i32 %idxprom |
| 41 | %0 = bitcast i16* %arrayidx to i8* |
| 42 | %shl = shl nuw nsw i32 %shr1, 3 |
| 43 | %or = or i32 %shl, 83886080 |
| 44 | ; CHECK: memd(r{{[0-9]*}}{{.}}++{{.}}#-8:circ(m{{[0-1]}})) |
| 45 | %1 = tail call i8* @llvm.hexagon.circ.std(i8* %0, i64 undef, i32 %or, i32 -8) |
| 46 | %2 = bitcast i8* %1 to i64* |
| 47 | %3 = load i64, i64* %2, align 8, !tbaa !0 |
| 48 | ret i64 %3 |
| 49 | } |
| 50 | |
| 51 | declare i8* @llvm.hexagon.circ.std(i8*, i64, i32, i32) nounwind |
| 52 | |
| 53 | define signext i16 @foo3(i16 zeroext %filtMemLen, i16* %filtMemLR, i16 signext %filtMemIndex) nounwind { |
| 54 | entry: |
| 55 | %conv = zext i16 %filtMemLen to i32 |
| 56 | %shr2 = and i32 %conv, 65534 |
| 57 | %idxprom = sext i16 %filtMemIndex to i32 |
| 58 | %arrayidx = getelementptr inbounds i16, i16* %filtMemLR, i32 %idxprom |
| 59 | %0 = bitcast i16* %arrayidx to i8* |
| 60 | %or = or i32 %shr2, 50331648 |
| 61 | ; CHECK: memh(r{{[0-9]*}}{{.}}++{{.}}#-2:circ(m{{[0-1]}})) |
| 62 | %1 = tail call i8* @llvm.hexagon.circ.sth(i8* %0, i32 0, i32 %or, i32 -2) |
| 63 | %2 = bitcast i8* %1 to i16* |
| 64 | %3 = load i16, i16* %2, align 2, !tbaa !2 |
| 65 | ret i16 %3 |
| 66 | } |
| 67 | |
| 68 | declare i8* @llvm.hexagon.circ.sth(i8*, i32, i32, i32) nounwind |
| 69 | |
| 70 | define signext i16 @foo5(i16 zeroext %filtMemLen, i16* %filtMemLR, i16 signext %filtMemIndex) nounwind { |
| 71 | entry: |
| 72 | %conv = zext i16 %filtMemLen to i32 |
| 73 | %shr2 = and i32 %conv, 65534 |
| 74 | %idxprom = sext i16 %filtMemIndex to i32 |
| 75 | %arrayidx = getelementptr inbounds i16, i16* %filtMemLR, i32 %idxprom |
| 76 | %0 = bitcast i16* %arrayidx to i8* |
| 77 | %or = or i32 %shr2, 50331648 |
| 78 | ; CHECK: memh(r{{[0-9]*}}{{.}}++{{.}}#-2:circ(m{{[0-1]}})){{ *}}={{ *}}r{{[0-9]*}}.h |
| 79 | %1 = tail call i8* @llvm.hexagon.circ.sthhi(i8* %0, i32 0, i32 %or, i32 -2) |
| 80 | %2 = bitcast i8* %1 to i16* |
| 81 | %3 = load i16, i16* %2, align 2, !tbaa !2 |
| 82 | ret i16 %3 |
| 83 | } |
| 84 | |
| 85 | declare i8* @llvm.hexagon.circ.sthhi(i8*, i32, i32, i32) nounwind |
| 86 | |
| 87 | define i32 @foo6(i16 zeroext %filtMemLen, i16* %filtMemLR, i16 signext %filtMemIndex) nounwind { |
| 88 | entry: |
| 89 | %conv = zext i16 %filtMemLen to i32 |
| 90 | %shr1 = lshr i32 %conv, 1 |
| 91 | %idxprom = sext i16 %filtMemIndex to i32 |
| 92 | %arrayidx = getelementptr inbounds i16, i16* %filtMemLR, i32 %idxprom |
| 93 | %0 = bitcast i16* %arrayidx to i8* |
| 94 | %shl = shl nuw nsw i32 %shr1, 2 |
| 95 | %or = or i32 %shl, 67108864 |
| 96 | ; CHECK: memw(r{{[0-9]*}}{{.}}++{{.}}#-4:circ(m{{[0-1]}})) |
| 97 | %1 = tail call i8* @llvm.hexagon.circ.stw(i8* %0, i32 undef, i32 %or, i32 -4) |
| 98 | %2 = bitcast i8* %1 to i32* |
| 99 | %3 = load i32, i32* %2, align 4, !tbaa !3 |
| 100 | ret i32 %3 |
| 101 | } |
| 102 | |
| 103 | declare i8* @llvm.hexagon.circ.stw(i8*, i32, i32, i32) nounwind |
| 104 | |
| 105 | !0 = !{!"omnipotent char", !1} |
| 106 | !1 = !{!"Simple C/C++ TBAA"} |
| 107 | !2 = !{!"short", !0} |
| 108 | !3 = !{!"int", !0} |