blob: ee0a41f2210f18c89bb940037b3cc83663eb35e0 [file] [log] [blame]
Matt Arsenaultcaa12882015-02-18 02:04:38 +00001; RUN: llc -march=amdgcn -mcpu=verde -show-mc-encoding -verify-machineinstrs < %s | FileCheck %s
2; RUN: llc -march=amdgcn -mcpu=tonga -show-mc-encoding -verify-machineinstrs < %s | FileCheck %s
Michel Danzer13736222014-01-27 07:20:51 +00003
4; Example of a simple geometry shader loading vertex attributes from the
5; ESGS ring buffer
6
Matt Arsenaultcaa12882015-02-18 02:04:38 +00007; FIXME: Out of bounds immediate offset crashes
Michel Danzer13736222014-01-27 07:20:51 +00008
Matt Arsenaultcaa12882015-02-18 02:04:38 +00009; CHECK-LABEL: {{^}}main:
Nikolay Haustov4f672a32016-04-29 09:02:30 +000010; CHECK: buffer_load_dword {{v[0-9]+}}, off, {{s\[[0-9]+:[0-9]+\]}}, 0 glc slc
Matt Arsenaultcaa12882015-02-18 02:04:38 +000011; CHECK: buffer_load_dword {{v[0-9]+}}, {{v[0-9]+}}, {{s\[[0-9]+:[0-9]+\]}}, 0 offen glc slc
12; CHECK: buffer_load_dword {{v[0-9]+}}, {{v[0-9]+}}, {{s\[[0-9]+:[0-9]+\]}}, 0 idxen glc slc
13; CHECK: buffer_load_dword {{v[0-9]+}}, {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 idxen offen glc slc
14; CHECK: s_movk_i32 [[K:s[0-9]+]], 0x4d2 ; encoding
15; CHECK: buffer_load_dword {{v[0-9]+}}, {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, [[K]] idxen offen offset:65535 glc slc
16
; @main: loads one <16 x i8> value from element 1 of %arg3, issues six
; llvm.SI.buffer.load.dword calls that all take that value as their first
; operand but differ in the remaining operands, and passes the results (bitcast
; to float) to two llvm.SI.export calls.
;
; NOTE(review): judging by how the CHECK lines at the top of the file line up
; with the calls, the nine intrinsic operands look like
; (rsrc, vaddr, soffset, inst_offset, offen, idxen, glc, slc, tfe) -- confirm
; against the intrinsic definition before relying on these names.
; NOTE(review): the file header describes a geometry shader, while this function
; is declared with the amdgpu_vs calling convention -- confirm which is intended.
Nicolai Haehnledf3a20c2016-04-06 19:40:20 +000017define amdgpu_vs void @main([17 x <16 x i8>] addrspace(2)* byval %arg, [32 x <16 x i8>] addrspace(2)* byval %arg1, [16 x <32 x i8>] addrspace(2)* byval %arg2, [2 x <16 x i8>] addrspace(2)* byval %arg3, [17 x <16 x i8>] addrspace(2)* inreg %arg4, [17 x <16 x i8>] addrspace(2)* inreg %arg5, i32 %arg6, i32 %arg7, i32 %arg8, i32 %arg9) {
Michel Danzer13736222014-01-27 07:20:51 +000018main_body:
  ; Fetch element 1 of the two-element array behind %arg3; every load below
  ; uses it as its first operand.
David Blaikie79e6c742015-02-27 19:29:02 +000019 %tmp = getelementptr [2 x <16 x i8>], [2 x <16 x i8>] addrspace(2)* %arg3, i64 0, i32 1
David Blaikiea79ac142015-02-27 21:17:42 +000020 %tmp10 = load <16 x i8>, <16 x i8> addrspace(2)* %tmp, !tbaa !0
  ; %arg6 shifted left by 2 (multiplied by 4); used as the second operand of the
  ; two i32-addressed loads that follow the first one.
Matt Arsenaultcaa12882015-02-18 02:04:38 +000021 %tmp11 = shl i32 %arg6, 2
  ; Load 1: second through sixth operands are all 0; seventh and eighth are 1.
  ; Presumably the load matched by the first CHECK (`off ... 0 glc slc`).
22 %tmp12 = call i32 @llvm.SI.buffer.load.dword.i32.i32(<16 x i8> %tmp10, i32 0, i32 0, i32 0, i32 0, i32 0, i32 1, i32 1, i32 0)
23 %tmp13 = bitcast i32 %tmp12 to float
  ; Load 2: %tmp11 as second operand, fifth operand set to 1.
  ; Presumably the `offen` CHECK.
24 %tmp14 = call i32 @llvm.SI.buffer.load.dword.i32.i32(<16 x i8> %tmp10, i32 %tmp11, i32 0, i32 0, i32 1, i32 0, i32 1, i32 1, i32 0)
25 %tmp15 = bitcast i32 %tmp14 to float
  ; Load 3: %tmp11 as second operand, sixth operand set to 1.
  ; Presumably the `idxen` CHECK.
26 %tmp16 = call i32 @llvm.SI.buffer.load.dword.i32.i32(<16 x i8> %tmp10, i32 %tmp11, i32 0, i32 0, i32 0, i32 1, i32 1, i32 1, i32 0)
27 %tmp17 = bitcast i32 %tmp16 to float
  ; Load 4: v2i32 variant with a zero vector as second operand; fifth and sixth
  ; operands both 1. Presumably the `idxen offen` CHECK with a VGPR pair.
28 %tmp18 = call i32 @llvm.SI.buffer.load.dword.i32.v2i32(<16 x i8> %tmp10, <2 x i32> zeroinitializer, i32 0, i32 0, i32 1, i32 1, i32 1, i32 1, i32 0)
29 %tmp19 = bitcast i32 %tmp18 to float
30
  ; Load 5: same as load 4 except the fourth operand is 123.
  ; NOTE(review): no CHECK line at the top of the file appears to cover this
  ; load (none mentions 123) -- confirm whether that is intentional.
31 %tmp20 = call i32 @llvm.SI.buffer.load.dword.i32.v2i32(<16 x i8> %tmp10, <2 x i32> zeroinitializer, i32 0, i32 123, i32 1, i32 1, i32 1, i32 1, i32 0)
32 %tmp21 = bitcast i32 %tmp20 to float
33
  ; Load 6: third operand 1234 (0x4d2, the constant in the s_movk_i32 CHECK) and
  ; fourth operand 65535 (the `offset:65535` in the last CHECK).
34 %tmp22 = call i32 @llvm.SI.buffer.load.dword.i32.v2i32(<16 x i8> %tmp10, <2 x i32> zeroinitializer, i32 1234, i32 65535, i32 1, i32 1, i32 1, i32 1, i32 0)
35 %tmp23 = bitcast i32 %tmp22 to float
36
  ; The first export consumes loads 1-4; the second consumes load 5 once and
  ; load 6 three times, so every loaded value has a use.
37 call void @llvm.SI.export(i32 15, i32 0, i32 1, i32 12, i32 0, float %tmp13, float %tmp15, float %tmp17, float %tmp19)
38 call void @llvm.SI.export(i32 15, i32 0, i32 1, i32 12, i32 0, float %tmp21, float %tmp23, float %tmp23, float %tmp23)
Michel Danzer13736222014-01-27 07:20:51 +000039 ret void
40}
41
; Buffer-load intrinsic variant whose second operand is a scalar i32; used by
; the first three loads in @main.
42; Function Attrs: nounwind readonly
Nicolai Haehnledf3a20c2016-04-06 19:40:20 +000043declare i32 @llvm.SI.buffer.load.dword.i32.i32(<16 x i8>, i32, i32, i32, i32, i32, i32, i32, i32) #0
Michel Danzer13736222014-01-27 07:20:51 +000044
; Buffer-load intrinsic variant whose second operand is a <2 x i32> vector; used
; by the last three loads in @main.
45; Function Attrs: nounwind readonly
Nicolai Haehnledf3a20c2016-04-06 19:40:20 +000046declare i32 @llvm.SI.buffer.load.dword.i32.v2i32(<16 x i8>, <2 x i32>, i32, i32, i32, i32, i32, i32, i32) #0
Michel Danzer13736222014-01-27 07:20:51 +000047
; Export intrinsic: five i32 operands followed by four float operands. It is
; declared without an attribute group, unlike the two loads above.
48declare void @llvm.SI.export(i32, i32, i32, i32, i32, float, float, float, float)
49
; Attribute group #0 is attached to both buffer-load declarations.
Nicolai Haehnledf3a20c2016-04-06 19:40:20 +000050attributes #0 = { nounwind readonly }
Michel Danzer13736222014-01-27 07:20:51 +000051
; TBAA metadata: !0 is the tag referenced by the `load` in @main (!tbaa !0) and
; points at the root node !1.
Sanjoy Das3336f682016-12-11 20:07:15 +000052!0 = !{!"const", !1, i32 1}
53!1 = !{!"tbaa root"}