Blame - llvm/test/CodeGen/AArch64/merge-store.ll - toolchain/llvm-project

blob: 86f5edd5da1d4b03d1f9afb0310006bbda7c0aaf [file] [log] [blame]

Akira Hatanaka	4cb3d06	2015-04-08 23:02:45 +0000	[diff] [blame]	1	; RUN: llc -march aarch64 %s -o - | FileCheck %s
Sanjay Patel	bbbf9a1	2015-09-25 21:49:48 +0000	[diff] [blame]	2	; RUN: llc < %s -mtriple=aarch64-unknown-unknown -mcpu=cyclone | FileCheck %s --check-prefix=CYCLONE
Akira Hatanaka	c6fab80	2015-04-08 20:34:53 +0000	[diff] [blame]	3
				4	@g0 = external global <3 x float>, align 16
				5	@g1 = external global <3 x float>, align 4
				6
				7	; CHECK: ldr s[[R0:[0-9]+]], {{\[}}[[R1:x[0-9]+]]{{\]}}, #4
Akira Hatanaka	4cb3d06	2015-04-08 23:02:45 +0000	[diff] [blame]	8	; CHECK: ld1{{\.?s?}} { v[[R0]]{{\.?s?}} }[1], {{\[}}[[R1]]{{\]}}
Akira Hatanaka	c6fab80	2015-04-08 20:34:53 +0000	[diff] [blame]	9	; CHECK: str d[[R0]]
				10
				11	define void @blam() { ; copies lanes 0 and 1 of @g0 into the first two floats of @g1 using two adjacent scalar stores
				12	%tmp4 = getelementptr inbounds <3 x float>, <3 x float>* @g1, i64 0, i64 0 ; address of element 0 of @g1
				13	%tmp5 = load <3 x float>, <3 x float>* @g0, align 16 ; first full-vector load of @g0
				14	%tmp6 = extractelement <3 x float> %tmp5, i64 0 ; lane 0 of @g0
				15	store float %tmp6, float* %tmp4 ; element 0 of @g1 = lane 0 of @g0
				16	%tmp7 = getelementptr inbounds float, float* %tmp4, i64 1 ; one float past %tmp4, i.e. element 1 of @g1
				17	%tmp8 = load <3 x float>, <3 x float>* @g0, align 16 ; @g0 is loaded a second time instead of reusing %tmp5
				18	%tmp9 = extractelement <3 x float> %tmp8, i64 1 ; lane 1 of @g0
				19	store float %tmp9, float* %tmp7 ; element 1 of @g1 = lane 1 of @g0; the checks before this function expect a `str d` store
				20	ret void;
				21	}
Sanjay Patel	bbbf9a1	2015-09-25 21:49:48 +0000	[diff] [blame]	22
				23
				24	; PR21711 - Merge vector stores into wider vector stores.
				25
				26	; On Cyclone, the stores should not get merged into a 16-byte store because
				27	; unaligned 16-byte stores are slow. This test would infinite loop when
				28	; the fastness of unaligned accesses was not specified correctly.
				29
				30	define void @merge_vec_extract_stores(<4 x float> %v1, <2 x float>* %ptr) { ; stores the two halves of %v1 to consecutive <2 x float> slots of %ptr
				31	%idx0 = getelementptr inbounds <2 x float>, <2 x float>* %ptr, i64 3 ; slot 3 of %ptr (the #24 offset in the expected output below)
				32	%idx1 = getelementptr inbounds <2 x float>, <2 x float>* %ptr, i64 4 ; slot 4 of %ptr, directly after slot 3 (the #32 offset below)
				33
				34	%shuffle0 = shufflevector <4 x float> %v1, <4 x float> undef, <2 x i32> <i32 0, i32 1> ; lanes 0-1 of %v1
				35	%shuffle1 = shufflevector <4 x float> %v1, <4 x float> undef, <2 x i32> <i32 2, i32 3> ; lanes 2-3 of %v1
				36
				37	store <2 x float> %shuffle0, <2 x float>* %idx0, align 8 ; only 8-byte alignment is promised
				38	store <2 x float> %shuffle1, <2 x float>* %idx1, align 8 ; adjacent to the store above, so the pair is a merge candidate
				39	ret void ; expected output follows: the default run wants one `stur q0` store, the cyclone run wants two `str d` stores
				40
				41	; CHECK-LABEL: merge_vec_extract_stores
				42	; CHECK: stur q0, [x0, #24]
				43	; CHECK-NEXT: ret
				44
				45	; CYCLONE-LABEL: merge_vec_extract_stores
				46	; CYCLONE: ext v1.16b, v0.16b, v0.16b, #8
				47	; CYCLONE-NEXT: str d0, [x0, #24]
				48	; CYCLONE-NEXT: str d1, [x0, #32]
				49	; CYCLONE-NEXT: ret
				50	}