blob: ac34d31b97c1b65efad2b515f3c9f5473ba9b4a0 [file] [log] [blame]
Tom Stellard49f8bfd2015-01-06 18:00:21 +00001;RUN: llc < %s -march=amdgcn -mcpu=verde -verify-machineinstrs | FileCheck %s
Marek Olsak75170772015-01-27 17:27:15 +00002;RUN: llc < %s -march=amdgcn -mcpu=tonga -verify-machineinstrs | FileCheck %s
Marek Olsak51b8e7b2014-06-18 22:00:29 +00003
Tom Stellard79243d92014-10-01 17:15:17 +00004;CHECK-LABEL: {{^}}getlod:
Nikolay Haustov2f684f12016-02-26 09:51:05 +00005;CHECK: image_get_lod {{v\[[0-9]+:[0-9]+\]}}, {{v[0-9]+}}, {{s\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}} dmask:0x3 da
Nicolai Haehnledf3a20c2016-04-06 19:40:20 +00006define amdgpu_ps void @getlod() {
Marek Olsak51b8e7b2014-06-18 22:00:29 +00007main_body:
Matt Arsenaultc5f61522016-01-26 04:43:48 +00008 %r = call <4 x float> @llvm.SI.getlod.i32(i32 undef, <8 x i32> undef, <4 x i32> undef, i32 15, i32 0, i32 0, i32 1, i32 0, i32 0, i32 0, i32 0)
Marek Olsak51b8e7b2014-06-18 22:00:29 +00009 %r0 = extractelement <4 x float> %r, i32 0
10 %r1 = extractelement <4 x float> %r, i32 1
11 call void @llvm.SI.export(i32 15, i32 1, i32 1, i32 0, i32 1, float %r0, float %r1, float %r0, float %r1)
12 ret void
13}
14
Tom Stellard79243d92014-10-01 17:15:17 +000015;CHECK-LABEL: {{^}}getlod_v2:
Nikolay Haustov2f684f12016-02-26 09:51:05 +000016;CHECK: image_get_lod {{v\[[0-9]+:[0-9]+\]}}, {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}} dmask:0x3 da
Nicolai Haehnledf3a20c2016-04-06 19:40:20 +000017define amdgpu_ps void @getlod_v2() {
Marek Olsak51b8e7b2014-06-18 22:00:29 +000018main_body:
Matt Arsenaultc5f61522016-01-26 04:43:48 +000019 %r = call <4 x float> @llvm.SI.getlod.v2i32(<2 x i32> undef, <8 x i32> undef, <4 x i32> undef, i32 15, i32 0, i32 0, i32 1, i32 0, i32 0, i32 0, i32 0)
Marek Olsak51b8e7b2014-06-18 22:00:29 +000020 %r0 = extractelement <4 x float> %r, i32 0
21 %r1 = extractelement <4 x float> %r, i32 1
22 call void @llvm.SI.export(i32 15, i32 1, i32 1, i32 0, i32 1, float %r0, float %r1, float %r0, float %r1)
23 ret void
24}
25
Tom Stellard79243d92014-10-01 17:15:17 +000026;CHECK-LABEL: {{^}}getlod_v4:
Nikolay Haustov2f684f12016-02-26 09:51:05 +000027;CHECK: image_get_lod {{v\[[0-9]+:[0-9]+\]}}, {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}} dmask:0x3 da
Nicolai Haehnledf3a20c2016-04-06 19:40:20 +000028define amdgpu_ps void @getlod_v4() {
Marek Olsak51b8e7b2014-06-18 22:00:29 +000029main_body:
Matt Arsenaultc5f61522016-01-26 04:43:48 +000030 %r = call <4 x float> @llvm.SI.getlod.v4i32(<4 x i32> undef, <8 x i32> undef, <4 x i32> undef, i32 15, i32 0, i32 0, i32 1, i32 0, i32 0, i32 0, i32 0)
Marek Olsak51b8e7b2014-06-18 22:00:29 +000031 %r0 = extractelement <4 x float> %r, i32 0
32 %r1 = extractelement <4 x float> %r, i32 1
33 call void @llvm.SI.export(i32 15, i32 1, i32 1, i32 0, i32 1, float %r0, float %r1, float %r0, float %r1)
34 ret void
35}
36
37
Nicolai Haehnledf3a20c2016-04-06 19:40:20 +000038declare <4 x float> @llvm.SI.getlod.i32(i32, <8 x i32>, <4 x i32>, i32, i32, i32, i32, i32, i32, i32, i32) #0
39declare <4 x float> @llvm.SI.getlod.v2i32(<2 x i32>, <8 x i32>, <4 x i32>, i32, i32, i32, i32, i32, i32, i32, i32) #0
40declare <4 x float> @llvm.SI.getlod.v4i32(<4 x i32>, <8 x i32>, <4 x i32>, i32, i32, i32, i32, i32, i32, i32, i32) #0
Marek Olsak51b8e7b2014-06-18 22:00:29 +000041
42declare void @llvm.SI.export(i32, i32, i32, i32, i32, float, float, float, float)
43
Nicolai Haehnledf3a20c2016-04-06 19:40:20 +000044attributes #0 = { nounwind readnone }