; Codegen test for the dimension-aware llvm.amdgcn.image.atomic.* intrinsics.
; All three invocations check the function labels under the GCN prefix. The
; verde and gfx900 invocations also enable the GFX6789 instruction checks and
; the gfx1010 invocation enables the GFX10 ones; without those extra prefixes
; the per-target instruction lines in this file are silently ignored.
; RUN: llc -march=amdgcn -mcpu=verde -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=GFX6789 %s
; RUN: llc -march=amdgcn -mcpu=gfx900 -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=GFX6789 %s
; RUN: llc -march=amdgcn -mcpu=gfx1010 -verify-machineinstrs -show-mc-encoding < %s | FileCheck -check-prefix=GCN -check-prefix=GFX10 %s

; image.atomic.swap on a 1D image. The GFX6789 line expects image_atomic_swap
; with dmask:0x1; the GFX10 line additionally expects dim:SQ_RSRC_IMG_1D.
; The i32 result is bitcast to float to match the function's return type.
; GCN-LABEL: {{^}}atomic_swap_1d:
; GFX6789: image_atomic_swap v0, v1, s[0:7] dmask:0x1 unorm glc{{$}}
; GFX10: image_atomic_swap v0, v1, s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_1D unorm glc ;
define amdgpu_ps float @atomic_swap_1d(<8 x i32> inreg %rsrc, i32 %data, i32 %s) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.swap.1d.i32.i32(i32 %data, i32 %s, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; image.atomic.add on a 1D image. The GFX6789 line expects image_atomic_add
; with dmask:0x1; the GFX10 line additionally expects dim:SQ_RSRC_IMG_1D.
; The i32 result is bitcast to float to match the function's return type.
; GCN-LABEL: {{^}}atomic_add_1d:
; GFX6789: image_atomic_add v0, v1, s[0:7] dmask:0x1 unorm glc{{$}}
; GFX10: image_atomic_add v0, v1, s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_1D unorm glc ;
define amdgpu_ps float @atomic_add_1d(<8 x i32> inreg %rsrc, i32 %data, i32 %s) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.add.1d.i32.i32(i32 %data, i32 %s, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; image.atomic.sub on a 1D image. The GFX6789 line expects image_atomic_sub
; with dmask:0x1; the GFX10 line additionally expects dim:SQ_RSRC_IMG_1D.
; The i32 result is bitcast to float to match the function's return type.
; GCN-LABEL: {{^}}atomic_sub_1d:
; GFX6789: image_atomic_sub v0, v1, s[0:7] dmask:0x1 unorm glc{{$}}
; GFX10: image_atomic_sub v0, v1, s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_1D unorm glc ;
define amdgpu_ps float @atomic_sub_1d(<8 x i32> inreg %rsrc, i32 %data, i32 %s) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.sub.1d.i32.i32(i32 %data, i32 %s, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; image.atomic.smin on a 1D image. The GFX6789 line expects image_atomic_smin
; with dmask:0x1; the GFX10 line additionally expects dim:SQ_RSRC_IMG_1D.
; The i32 result is bitcast to float to match the function's return type.
; GCN-LABEL: {{^}}atomic_smin_1d:
; GFX6789: image_atomic_smin v0, v1, s[0:7] dmask:0x1 unorm glc{{$}}
; GFX10: image_atomic_smin v0, v1, s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_1D unorm glc ;
define amdgpu_ps float @atomic_smin_1d(<8 x i32> inreg %rsrc, i32 %data, i32 %s) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.smin.1d.i32.i32(i32 %data, i32 %s, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; image.atomic.umin on a 1D image. The GFX6789 line expects image_atomic_umin
; with dmask:0x1; the GFX10 line additionally expects dim:SQ_RSRC_IMG_1D.
; The i32 result is bitcast to float to match the function's return type.
; GCN-LABEL: {{^}}atomic_umin_1d:
; GFX6789: image_atomic_umin v0, v1, s[0:7] dmask:0x1 unorm glc{{$}}
; GFX10: image_atomic_umin v0, v1, s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_1D unorm glc ;
define amdgpu_ps float @atomic_umin_1d(<8 x i32> inreg %rsrc, i32 %data, i32 %s) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.umin.1d.i32.i32(i32 %data, i32 %s, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; image.atomic.smax on a 1D image. The GFX6789 line expects image_atomic_smax
; with dmask:0x1; the GFX10 line additionally expects dim:SQ_RSRC_IMG_1D.
; The i32 result is bitcast to float to match the function's return type.
; GCN-LABEL: {{^}}atomic_smax_1d:
; GFX6789: image_atomic_smax v0, v1, s[0:7] dmask:0x1 unorm glc{{$}}
; GFX10: image_atomic_smax v0, v1, s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_1D unorm glc ;
define amdgpu_ps float @atomic_smax_1d(<8 x i32> inreg %rsrc, i32 %data, i32 %s) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.smax.1d.i32.i32(i32 %data, i32 %s, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; image.atomic.umax on a 1D image. The GFX6789 line expects image_atomic_umax
; with dmask:0x1; the GFX10 line additionally expects dim:SQ_RSRC_IMG_1D.
; The i32 result is bitcast to float to match the function's return type.
; GCN-LABEL: {{^}}atomic_umax_1d:
; GFX6789: image_atomic_umax v0, v1, s[0:7] dmask:0x1 unorm glc{{$}}
; GFX10: image_atomic_umax v0, v1, s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_1D unorm glc ;
define amdgpu_ps float @atomic_umax_1d(<8 x i32> inreg %rsrc, i32 %data, i32 %s) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.umax.1d.i32.i32(i32 %data, i32 %s, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; image.atomic.and on a 1D image. The GFX6789 line expects image_atomic_and
; with dmask:0x1; the GFX10 line additionally expects dim:SQ_RSRC_IMG_1D.
; The i32 result is bitcast to float to match the function's return type.
; GCN-LABEL: {{^}}atomic_and_1d:
; GFX6789: image_atomic_and v0, v1, s[0:7] dmask:0x1 unorm glc{{$}}
; GFX10: image_atomic_and v0, v1, s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_1D unorm glc ;
define amdgpu_ps float @atomic_and_1d(<8 x i32> inreg %rsrc, i32 %data, i32 %s) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.and.1d.i32.i32(i32 %data, i32 %s, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; image.atomic.or on a 1D image. The GFX6789 line expects image_atomic_or
; with dmask:0x1; the GFX10 line additionally expects dim:SQ_RSRC_IMG_1D.
; The i32 result is bitcast to float to match the function's return type.
; GCN-LABEL: {{^}}atomic_or_1d:
; GFX6789: image_atomic_or v0, v1, s[0:7] dmask:0x1 unorm glc{{$}}
; GFX10: image_atomic_or v0, v1, s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_1D unorm glc ;
define amdgpu_ps float @atomic_or_1d(<8 x i32> inreg %rsrc, i32 %data, i32 %s) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.or.1d.i32.i32(i32 %data, i32 %s, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; image.atomic.xor on a 1D image. The GFX6789 line expects image_atomic_xor
; with dmask:0x1; the GFX10 line additionally expects dim:SQ_RSRC_IMG_1D.
; The i32 result is bitcast to float to match the function's return type.
; GCN-LABEL: {{^}}atomic_xor_1d:
; GFX6789: image_atomic_xor v0, v1, s[0:7] dmask:0x1 unorm glc{{$}}
; GFX10: image_atomic_xor v0, v1, s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_1D unorm glc ;
define amdgpu_ps float @atomic_xor_1d(<8 x i32> inreg %rsrc, i32 %data, i32 %s) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.xor.1d.i32.i32(i32 %data, i32 %s, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; image.atomic.inc on a 1D image. The GFX6789 line expects image_atomic_inc
; with dmask:0x1; the GFX10 line additionally expects dim:SQ_RSRC_IMG_1D.
; The i32 result is bitcast to float to match the function's return type.
; GCN-LABEL: {{^}}atomic_inc_1d:
; GFX6789: image_atomic_inc v0, v1, s[0:7] dmask:0x1 unorm glc{{$}}
; GFX10: image_atomic_inc v0, v1, s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_1D unorm glc ;
define amdgpu_ps float @atomic_inc_1d(<8 x i32> inreg %rsrc, i32 %data, i32 %s) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.inc.1d.i32.i32(i32 %data, i32 %s, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; image.atomic.dec on a 1D image. The GFX6789 line expects image_atomic_dec
; with dmask:0x1; the GFX10 line additionally expects dim:SQ_RSRC_IMG_1D.
; The i32 result is bitcast to float to match the function's return type.
; GCN-LABEL: {{^}}atomic_dec_1d:
; GFX6789: image_atomic_dec v0, v1, s[0:7] dmask:0x1 unorm glc{{$}}
; GFX10: image_atomic_dec v0, v1, s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_1D unorm glc ;
define amdgpu_ps float @atomic_dec_1d(<8 x i32> inreg %rsrc, i32 %data, i32 %s) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.dec.1d.i32.i32(i32 %data, i32 %s, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; image.atomic.cmpswap on a 1D image. Unlike the single-operand atomics in
; this file, the intrinsic takes two data operands (%cmp, %swap); the checks
; expect them as the register pair v[0:1] with dmask:0x3 and the coordinate in
; v2. The GFX10 line additionally expects dim:SQ_RSRC_IMG_1D.
; GCN-LABEL: {{^}}atomic_cmpswap_1d:
; GFX6789: image_atomic_cmpswap v[0:1], v2, s[0:7] dmask:0x3 unorm glc{{$}}
; GFX10: image_atomic_cmpswap v[0:1], v2, s[0:7] dmask:0x3 dim:SQ_RSRC_IMG_1D unorm glc ;
define amdgpu_ps float @atomic_cmpswap_1d(<8 x i32> inreg %rsrc, i32 %cmp, i32 %swap, i32 %s) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.cmpswap.1d.i32.i32(i32 %cmp, i32 %swap, i32 %s, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; image.atomic.add on a 2D image. The two coordinates (%s, %t) are expected
; in the register pair v[1:2]; the GFX10 line additionally expects
; dim:SQ_RSRC_IMG_2D.
; GCN-LABEL: {{^}}atomic_add_2d:
; GFX6789: image_atomic_add v0, v[1:2], s[0:7] dmask:0x1 unorm glc{{$}}
; GFX10: image_atomic_add v0, v[1:2], s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_2D unorm glc ;
define amdgpu_ps float @atomic_add_2d(<8 x i32> inreg %rsrc, i32 %data, i32 %s, i32 %t) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.add.2d.i32.i32(i32 %data, i32 %s, i32 %t, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; image.atomic.add on a 3D image. Three coordinates (%s, %t, %r) are passed,
; and the checks expect the address operand as the four-register tuple
; v[1:4]. The GFX10 line additionally expects dim:SQ_RSRC_IMG_3D.
; GCN-LABEL: {{^}}atomic_add_3d:
; GFX6789: image_atomic_add v0, v[1:4], s[0:7] dmask:0x1 unorm glc{{$}}
; GFX10: image_atomic_add v0, v[1:4], s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_3D unorm glc ;
define amdgpu_ps float @atomic_add_3d(<8 x i32> inreg %rsrc, i32 %data, i32 %s, i32 %t, i32 %r) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.add.3d.i32.i32(i32 %data, i32 %s, i32 %t, i32 %r, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; image.atomic.add on a cube image (%s, %t, %face). The GFX6789 line expects
; the trailing `da` modifier; the GFX10 line expects dim:SQ_RSRC_IMG_CUBE and
; no `da`.
; GCN-LABEL: {{^}}atomic_add_cube:
; GFX6789: image_atomic_add v0, v[1:4], s[0:7] dmask:0x1 unorm glc da{{$}}
; GFX10: image_atomic_add v0, v[1:4], s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_CUBE unorm glc ;
define amdgpu_ps float @atomic_add_cube(<8 x i32> inreg %rsrc, i32 %data, i32 %s, i32 %t, i32 %face) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.add.cube.i32.i32(i32 %data, i32 %s, i32 %t, i32 %face, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; image.atomic.add on a 1D array image (%s, %slice). The GFX6789 line expects
; the trailing `da` modifier; the GFX10 line expects
; dim:SQ_RSRC_IMG_1D_ARRAY and no `da`.
; GCN-LABEL: {{^}}atomic_add_1darray:
; GFX6789: image_atomic_add v0, v[1:2], s[0:7] dmask:0x1 unorm glc da{{$}}
; GFX10: image_atomic_add v0, v[1:2], s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_1D_ARRAY unorm glc ;
define amdgpu_ps float @atomic_add_1darray(<8 x i32> inreg %rsrc, i32 %data, i32 %s, i32 %slice) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.add.1darray.i32.i32(i32 %data, i32 %s, i32 %slice, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; image.atomic.add on a 2D array image (%s, %t, %slice). The GFX6789 line
; expects the trailing `da` modifier; the GFX10 line expects
; dim:SQ_RSRC_IMG_2D_ARRAY and no `da`.
; GCN-LABEL: {{^}}atomic_add_2darray:
; GFX6789: image_atomic_add v0, v[1:4], s[0:7] dmask:0x1 unorm glc da{{$}}
; GFX10: image_atomic_add v0, v[1:4], s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_2D_ARRAY unorm glc ;
define amdgpu_ps float @atomic_add_2darray(<8 x i32> inreg %rsrc, i32 %data, i32 %s, i32 %t, i32 %slice) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.add.2darray.i32.i32(i32 %data, i32 %s, i32 %t, i32 %slice, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; image.atomic.add on a 2D multisampled image (%s, %t, %fragid). Neither
; check line expects `da`; the GFX10 line additionally expects
; dim:SQ_RSRC_IMG_2D_MSAA.
; GCN-LABEL: {{^}}atomic_add_2dmsaa:
; GFX6789: image_atomic_add v0, v[1:4], s[0:7] dmask:0x1 unorm glc{{$}}
; GFX10: image_atomic_add v0, v[1:4], s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_2D_MSAA unorm glc ;
define amdgpu_ps float @atomic_add_2dmsaa(<8 x i32> inreg %rsrc, i32 %data, i32 %s, i32 %t, i32 %fragid) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.add.2dmsaa.i32.i32(i32 %data, i32 %s, i32 %t, i32 %fragid, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; image.atomic.add on a 2D multisampled array image (%s, %t, %slice,
; %fragid). The GFX6789 line expects the trailing `da` modifier; the GFX10
; line expects dim:SQ_RSRC_IMG_2D_MSAA_ARRAY and no `da`.
; GCN-LABEL: {{^}}atomic_add_2darraymsaa:
; GFX6789: image_atomic_add v0, v[1:4], s[0:7] dmask:0x1 unorm glc da{{$}}
; GFX10: image_atomic_add v0, v[1:4], s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_2D_MSAA_ARRAY unorm glc ;
define amdgpu_ps float @atomic_add_2darraymsaa(<8 x i32> inreg %rsrc, i32 %data, i32 %s, i32 %t, i32 %slice, i32 %fragid) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.add.2darraymsaa.i32.i32(i32 %data, i32 %s, i32 %t, i32 %slice, i32 %fragid, <8 x i32> %rsrc, i32 0, i32 0)
  %out = bitcast i32 %v to float
  ret float %out
}

; Same as atomic_add_1d except that the final i32 operand of the intrinsic
; call is 2 instead of 0; both check lines then expect an extra `slc`
; modifier after `glc`.
; GCN-LABEL: {{^}}atomic_add_1d_slc:
; GFX6789: image_atomic_add v0, v1, s[0:7] dmask:0x1 unorm glc slc{{$}}
; GFX10: image_atomic_add v0, v1, s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_1D unorm glc slc ;
define amdgpu_ps float @atomic_add_1d_slc(<8 x i32> inreg %rsrc, i32 %data, i32 %s) {
main_body:
  %v = call i32 @llvm.amdgcn.image.atomic.add.1d.i32.i32(i32 %data, i32 %s, <8 x i32> %rsrc, i32 0, i32 2)
  %out = bitcast i32 %v to float
  ret float %out
}

; Declarations of the 1D image atomic intrinsics exercised above. Callers in
; this file pass: the data operand(s), one i32 coordinate, the <8 x i32>
; resource, and two trailing constant i32 operands (presumably texfailctrl and
; cachepolicy; confirm against the AMDGPU intrinsic definitions). cmpswap
; takes two data operands instead of one.
declare i32 @llvm.amdgcn.image.atomic.swap.1d.i32.i32(i32, i32, <8 x i32>, i32, i32) #0
declare i32 @llvm.amdgcn.image.atomic.add.1d.i32.i32(i32, i32, <8 x i32>, i32, i32) #0
declare i32 @llvm.amdgcn.image.atomic.sub.1d.i32.i32(i32, i32, <8 x i32>, i32, i32) #0
declare i32 @llvm.amdgcn.image.atomic.smin.1d.i32.i32(i32, i32, <8 x i32>, i32, i32) #0
declare i32 @llvm.amdgcn.image.atomic.umin.1d.i32.i32(i32, i32, <8 x i32>, i32, i32) #0
declare i32 @llvm.amdgcn.image.atomic.smax.1d.i32.i32(i32, i32, <8 x i32>, i32, i32) #0
declare i32 @llvm.amdgcn.image.atomic.umax.1d.i32.i32(i32, i32, <8 x i32>, i32, i32) #0
declare i32 @llvm.amdgcn.image.atomic.and.1d.i32.i32(i32, i32, <8 x i32>, i32, i32) #0
declare i32 @llvm.amdgcn.image.atomic.or.1d.i32.i32(i32, i32, <8 x i32>, i32, i32) #0
declare i32 @llvm.amdgcn.image.atomic.xor.1d.i32.i32(i32, i32, <8 x i32>, i32, i32) #0
declare i32 @llvm.amdgcn.image.atomic.inc.1d.i32.i32(i32, i32, <8 x i32>, i32, i32) #0
declare i32 @llvm.amdgcn.image.atomic.dec.1d.i32.i32(i32, i32, <8 x i32>, i32, i32) #0
declare i32 @llvm.amdgcn.image.atomic.cmpswap.1d.i32.i32(i32, i32, i32, <8 x i32>, i32, i32) #0

; Declarations of image.atomic.add for the remaining image dimensions. They
; differ from the 1D form only in the number of i32 coordinate operands
; between the data operand and the <8 x i32> resource: two for 2d and
; 1darray, three for 3d, cube, 2darray and 2dmsaa, four for 2darraymsaa.
declare i32 @llvm.amdgcn.image.atomic.add.2d.i32.i32(i32, i32, i32, <8 x i32>, i32, i32) #0
declare i32 @llvm.amdgcn.image.atomic.add.3d.i32.i32(i32, i32, i32, i32, <8 x i32>, i32, i32) #0
declare i32 @llvm.amdgcn.image.atomic.add.cube.i32.i32(i32, i32, i32, i32, <8 x i32>, i32, i32) #0
declare i32 @llvm.amdgcn.image.atomic.add.1darray.i32.i32(i32, i32, i32, <8 x i32>, i32, i32) #0
declare i32 @llvm.amdgcn.image.atomic.add.2darray.i32.i32(i32, i32, i32, i32, <8 x i32>, i32, i32) #0
declare i32 @llvm.amdgcn.image.atomic.add.2dmsaa.i32.i32(i32, i32, i32, i32, <8 x i32>, i32, i32) #0
declare i32 @llvm.amdgcn.image.atomic.add.2darraymsaa.i32.i32(i32, i32, i32, i32, i32, <8 x i32>, i32, i32) #0

; Attribute groups. Only #0 is referenced by the declarations in this file;
; #1 and #2 are defined but not used by anything visible here.
attributes #0 = { nounwind }
attributes #1 = { nounwind readonly }
attributes #2 = { nounwind readnone }