blob: 76f533d06391beb93295dfacc449ac4dcc855d47 [file] [log] [blame]
Anastasia Stulova0df4ac32016-11-14 17:39:58 +00001// RUN: %clang_cc1 %s -cl-std=CL2.0 -ffake-address-space-map -O0 -emit-llvm -o - -triple "spir-unknown-unknown" | FileCheck %s --check-prefix=COMMON --check-prefix=B32
2// RUN: %clang_cc1 %s -cl-std=CL2.0 -ffake-address-space-map -O0 -emit-llvm -o - -triple "spir64-unknown-unknown" | FileCheck %s --check-prefix=COMMON --check-prefix=B64
Scott Linderf8b3df42018-08-07 15:52:49 +00003// RUN: %clang_cc1 %s -cl-std=CL2.0 -ffake-address-space-map -O1 -emit-llvm -o - -triple "spir64-unknown-unknown" | FileCheck %s --check-prefix=CHECK-LIFETIMES
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +00004
Joey Gouly84ae3362017-07-31 15:15:59 +00005#pragma OPENCL EXTENSION cl_khr_subgroups : enable
6
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +00007typedef void (^bl_t)(local void *);
Anastasia Stulova58984e72017-02-16 12:27:47 +00008typedef struct {int a;} ndrange_t;
9
Sven van Haastregtda3b6322018-10-02 13:02:24 +000010// COMMON: %struct.__opencl_block_literal_generic = type { i32, i32, i8 addrspace(4)* }
11
Yaxun Liuc2a87a02017-10-14 12:23:50 +000012// For a block global variable, first emit the block literal as a global variable, then emit the block variable itself.
Sven van Haastregtda3b6322018-10-02 13:02:24 +000013// COMMON: [[BL_GLOBAL:@__block_literal_global[^ ]*]] = internal addrspace(1) constant { i32, i32, i8 addrspace(4)* } { i32 {{[0-9]+}}, i32 {{[0-9]+}}, i8 addrspace(4)* addrspacecast (i8* bitcast (void (i8 addrspace(4)*, i8 addrspace(3)*)* [[INV_G:@[^ ]+]] to i8*) to i8 addrspace(4)*) }
14// COMMON: @block_G = addrspace(1) constant void (i8 addrspace(3)*) addrspace(4)* addrspacecast (void (i8 addrspace(3)*) addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BL_GLOBAL]] to void (i8 addrspace(3)*) addrspace(1)*) to void (i8 addrspace(3)*) addrspace(4)*)
Yaxun Liuc2a87a02017-10-14 12:23:50 +000015
16// For anonymous blocks without captures, emit block literals as global variable.
Sven van Haastregtda3b6322018-10-02 13:02:24 +000017// COMMON: [[BLG1:@__block_literal_global[^ ]*]] = internal addrspace(1) constant { i32, i32, i8 addrspace(4)* } { i32 {{[0-9]+}}, i32 {{[0-9]+}}, i8 addrspace(4)* addrspacecast (i8* bitcast (void (i8 addrspace(4)*, i8 addrspace(3)*)* {{@[^ ]+}} to i8*) to i8 addrspace(4)*) }
18// COMMON: [[BLG2:@__block_literal_global[^ ]*]] = internal addrspace(1) constant { i32, i32, i8 addrspace(4)* } { i32 {{[0-9]+}}, i32 {{[0-9]+}}, i8 addrspace(4)* addrspacecast (i8* bitcast (void (i8 addrspace(4)*, i8 addrspace(3)*)* {{@[^ ]+}} to i8*) to i8 addrspace(4)*) }
19// COMMON: [[BLG3:@__block_literal_global[^ ]*]] = internal addrspace(1) constant { i32, i32, i8 addrspace(4)* } { i32 {{[0-9]+}}, i32 {{[0-9]+}}, i8 addrspace(4)* addrspacecast (i8* bitcast (void (i8 addrspace(4)*, i8 addrspace(3)*)* {{@[^ ]+}} to i8*) to i8 addrspace(4)*) }
20// COMMON: [[BLG4:@__block_literal_global[^ ]*]] = internal addrspace(1) constant { i32, i32, i8 addrspace(4)* } { i32 {{[0-9]+}}, i32 {{[0-9]+}}, i8 addrspace(4)* addrspacecast (i8* bitcast (void (i8 addrspace(4)*, i8 addrspace(3)*)* {{@[^ ]+}} to i8*) to i8 addrspace(4)*) }
21// COMMON: [[BLG5:@__block_literal_global[^ ]*]] = internal addrspace(1) constant { i32, i32, i8 addrspace(4)* } { i32 {{[0-9]+}}, i32 {{[0-9]+}}, i8 addrspace(4)* addrspacecast (i8* bitcast (void (i8 addrspace(4)*, i8 addrspace(3)*)* {{@[^ ]+}} to i8*) to i8 addrspace(4)*) }
22// COMMON: [[BLG6:@__block_literal_global[^ ]*]] = internal addrspace(1) constant { i32, i32, i8 addrspace(4)* } { i32 {{[0-9]+}}, i32 {{[0-9]+}}, i8 addrspace(4)* addrspacecast (i8* bitcast (void (i8 addrspace(4)*, i8 addrspace(3)*, i8 addrspace(3)*, i8 addrspace(3)*)* {{@[^ ]+}} to i8*) to i8 addrspace(4)*) }
23// COMMON: [[BLG7:@__block_literal_global[^ ]*]] = internal addrspace(1) constant { i32, i32, i8 addrspace(4)* } { i32 {{[0-9]+}}, i32 {{[0-9]+}}, i8 addrspace(4)* addrspacecast (i8* bitcast (void (i8 addrspace(4)*, i8 addrspace(3)*)* {{@[^ ]+}} to i8*) to i8 addrspace(4)*) }
24// COMMON: [[BLG8:@__block_literal_global[^ ]*]] = internal addrspace(1) constant { i32, i32, i8 addrspace(4)* } { i32 {{[0-9]+}}, i32 {{[0-9]+}}, i8 addrspace(4)* addrspacecast (i8* bitcast (void (i8 addrspace(4)*)* [[INVG8:@[^ ]+]] to i8*) to i8 addrspace(4)*) }
25// COMMON: [[BLG9:@__block_literal_global[^ ]*]] = internal addrspace(1) constant { i32, i32, i8 addrspace(4)* } { i32 {{[0-9]+}}, i32 {{[0-9]+}}, i8 addrspace(4)* addrspacecast (i8* bitcast (void (i8 addrspace(4)*, i8 addrspace(3)*)* [[INVG9:@[^ ]+]] to i8*) to i8 addrspace(4)*) }
26// COMMON: [[BLG10:@__block_literal_global[^ ]*]] = internal addrspace(1) constant { i32, i32, i8 addrspace(4)* } { i32 {{[0-9]+}}, i32 {{[0-9]+}}, i8 addrspace(4)* addrspacecast (i8* bitcast (void (i8 addrspace(4)*)* {{@[^ ]+}} to i8*) to i8 addrspace(4)*) }
27// COMMON: [[BLG11:@__block_literal_global[^ ]*]] = internal addrspace(1) constant { i32, i32, i8 addrspace(4)* } { i32 {{[0-9]+}}, i32 {{[0-9]+}}, i8 addrspace(4)* addrspacecast (i8* bitcast (void (i8 addrspace(4)*)* {{@[^ ]+}} to i8*) to i8 addrspace(4)*) }
Yaxun Liuc2a87a02017-10-14 12:23:50 +000028
29// Emits block literal [[BL_GLOBAL]], invoke function [[INV_G]] and global block variable @block_G
Sven van Haastregtda3b6322018-10-02 13:02:24 +000030// COMMON: define internal spir_func void [[INV_G]](i8 addrspace(4)* %{{.*}}, i8 addrspace(3)* %{{.*}})
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +000031const bl_t block_G = (bl_t) ^ (local void *a) {};
32
Yaxun Liufa13d012018-02-15 16:39:19 +000033void callee(int id, __global int *out) {
34 out[id] = id;
35}
36
Yaxun Liuc2a87a02017-10-14 12:23:50 +000037// COMMON-LABEL: define spir_kernel void @device_side_enqueue(i32 addrspace(1)* %{{.*}}, i32 addrspace(1)* %b, i32 %i)
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +000038kernel void device_side_enqueue(global int *a, global int *b, int i) {
Anastasia Stulova0df4ac32016-11-14 17:39:58 +000039 // COMMON: %default_queue = alloca %opencl.queue_t*
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +000040 queue_t default_queue;
Anastasia Stulova0df4ac32016-11-14 17:39:58 +000041 // COMMON: %flags = alloca i32
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +000042 unsigned flags = 0;
Anastasia Stulova58984e72017-02-16 12:27:47 +000043 // COMMON: %ndrange = alloca %struct.ndrange_t
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +000044 ndrange_t ndrange;
Anastasia Stulova0df4ac32016-11-14 17:39:58 +000045 // COMMON: %clk_event = alloca %opencl.clk_event_t*
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +000046 clk_event_t clk_event;
Anastasia Stulova0df4ac32016-11-14 17:39:58 +000047 // COMMON: %event_wait_list = alloca %opencl.clk_event_t*
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +000048 clk_event_t event_wait_list;
Anastasia Stulova0df4ac32016-11-14 17:39:58 +000049 // COMMON: %event_wait_list2 = alloca [1 x %opencl.clk_event_t*]
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +000050 clk_event_t event_wait_list2[] = {clk_event};
51
Vlad Tsyrklevichc7d3d342018-08-03 17:47:58 +000052 // COMMON: [[NDR:%[a-z0-9]+]] = alloca %struct.ndrange_t, align 4
Scott Linderf8b3df42018-08-07 15:52:49 +000053
54 // B32: %[[BLOCK_SIZES1:.*]] = alloca [1 x i32]
55 // B64: %[[BLOCK_SIZES1:.*]] = alloca [1 x i64]
56 // CHECK-LIFETIMES: %[[BLOCK_SIZES1:.*]] = alloca [1 x i64]
57 // B32: %[[BLOCK_SIZES2:.*]] = alloca [1 x i32]
58 // B64: %[[BLOCK_SIZES2:.*]] = alloca [1 x i64]
59 // CHECK-LIFETIMES: %[[BLOCK_SIZES2:.*]] = alloca [1 x i64]
60 // B32: %[[BLOCK_SIZES3:.*]] = alloca [1 x i32]
61 // B64: %[[BLOCK_SIZES3:.*]] = alloca [1 x i64]
62 // CHECK-LIFETIMES: %[[BLOCK_SIZES3:.*]] = alloca [1 x i64]
63 // B32: %[[BLOCK_SIZES4:.*]] = alloca [1 x i32]
64 // B64: %[[BLOCK_SIZES4:.*]] = alloca [1 x i64]
65 // CHECK-LIFETIMES: %[[BLOCK_SIZES4:.*]] = alloca [1 x i64]
66 // B32: %[[BLOCK_SIZES5:.*]] = alloca [1 x i32]
67 // B64: %[[BLOCK_SIZES5:.*]] = alloca [1 x i64]
68 // CHECK-LIFETIMES: %[[BLOCK_SIZES5:.*]] = alloca [1 x i64]
69 // B32: %[[BLOCK_SIZES6:.*]] = alloca [3 x i32]
70 // B64: %[[BLOCK_SIZES6:.*]] = alloca [3 x i64]
71 // CHECK-LIFETIMES: %[[BLOCK_SIZES6:.*]] = alloca [3 x i64]
72 // B32: %[[BLOCK_SIZES7:.*]] = alloca [1 x i32]
73 // B64: %[[BLOCK_SIZES7:.*]] = alloca [1 x i64]
74 // CHECK-LIFETIMES: %[[BLOCK_SIZES7:.*]] = alloca [1 x i64]
75
76 // Emits block literal on stack and block kernel [[INVLK1]].
Anastasia Stulova0df4ac32016-11-14 17:39:58 +000077 // COMMON: [[DEF_Q:%[0-9]+]] = load %opencl.queue_t{{.*}}*, %opencl.queue_t{{.*}}** %default_queue
78 // COMMON: [[FLAGS:%[0-9]+]] = load i32, i32* %flags
Sven van Haastregtda3b6322018-10-02 13:02:24 +000079 // COMMON: store i8 addrspace(4)* addrspacecast (i8* bitcast (void (i8 addrspace(4)*)* [[INVL1:@__device_side_enqueue_block_invoke[^ ]*]] to i8*) to i8 addrspace(4)*), i8 addrspace(4)** %block.invoke
80 // B32: [[BL:%[0-9]+]] = bitcast <{ i32, i32, i8 addrspace(4)*, i32 addrspace(1)*, i32, i32 addrspace(1)* }>* %block to void ()*
81 // B64: [[BL:%[0-9]+]] = bitcast <{ i32, i32, i8 addrspace(4)*, i32 addrspace(1)*, i32 addrspace(1)*, i32 }>* %block to void ()*
Anastasia Stulovaaf0a7bb2017-01-27 15:11:34 +000082 // COMMON: [[BL_I8:%[0-9]+]] = addrspacecast void ()* [[BL]] to i8 addrspace(4)*
Yaxun Liuc2a87a02017-10-14 12:23:50 +000083 // COMMON-LABEL: call i32 @__enqueue_kernel_basic(
84 // COMMON-SAME: %opencl.queue_t{{.*}}* [[DEF_Q]], i32 [[FLAGS]], %struct.ndrange_t* byval [[NDR]]{{([0-9]+)?}},
85 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8* bitcast ({{.*}} [[INVLK1:[^ ]+_kernel]] to i8*) to i8 addrspace(4)*),
86 // COMMON-SAME: i8 addrspace(4)* [[BL_I8]])
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +000087 enqueue_kernel(default_queue, flags, ndrange,
88 ^(void) {
89 a[i] = b[i];
90 });
91
Yaxun Liuc2a87a02017-10-14 12:23:50 +000092 // Emits block literal on stack and block kernel [[INVLK2]].
Anastasia Stulova0df4ac32016-11-14 17:39:58 +000093 // COMMON: [[DEF_Q:%[0-9]+]] = load %opencl.queue_t{{.*}}*, %opencl.queue_t{{.*}}** %default_queue
94 // COMMON: [[FLAGS:%[0-9]+]] = load i32, i32* %flags
Anastasia Stulova0df4ac32016-11-14 17:39:58 +000095 // COMMON: [[WAIT_EVNT:%[0-9]+]] = addrspacecast %opencl.clk_event_t{{.*}}** %event_wait_list to %opencl.clk_event_t{{.*}}* addrspace(4)*
96 // COMMON: [[EVNT:%[0-9]+]] = addrspacecast %opencl.clk_event_t{{.*}}** %clk_event to %opencl.clk_event_t{{.*}}* addrspace(4)*
Sven van Haastregtda3b6322018-10-02 13:02:24 +000097 // COMMON: store i8 addrspace(4)* addrspacecast (i8* bitcast (void (i8 addrspace(4)*)* [[INVL2:@__device_side_enqueue_block_invoke[^ ]*]] to i8*) to i8 addrspace(4)*), i8 addrspace(4)** %block.invoke
98 // COMMON: [[BL:%[0-9]+]] = bitcast <{ i32, i32, i8 addrspace(4)*, i32{{.*}}, i32{{.*}}, i32{{.*}} }>* %block3 to void ()*
Anastasia Stulovaaf0a7bb2017-01-27 15:11:34 +000099 // COMMON: [[BL_I8:%[0-9]+]] = addrspacecast void ()* [[BL]] to i8 addrspace(4)*
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000100 // COMMON-LABEL: call i32 @__enqueue_kernel_basic_events
101 // COMMON-SAME: (%opencl.queue_t{{.*}}* [[DEF_Q]], i32 [[FLAGS]], %struct.ndrange_t* {{.*}}, i32 2, %opencl.clk_event_t{{.*}}* addrspace(4)* [[WAIT_EVNT]], %opencl.clk_event_t{{.*}}* addrspace(4)* [[EVNT]],
102 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8* bitcast ({{.*}} [[INVLK2:[^ ]+_kernel]] to i8*) to i8 addrspace(4)*),
103 // COMMON-SAME: i8 addrspace(4)* [[BL_I8]])
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +0000104 enqueue_kernel(default_queue, flags, ndrange, 2, &event_wait_list, &clk_event,
105 ^(void) {
106 a[i] = b[i];
107 });
108
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000109 // Emits global block literal [[BLG1]] and block kernel [[INVGK1]].
Anastasia Stulova0df4ac32016-11-14 17:39:58 +0000110 // COMMON: [[DEF_Q:%[0-9]+]] = load %opencl.queue_t{{.*}}*, %opencl.queue_t{{.*}}** %default_queue
111 // COMMON: [[FLAGS:%[0-9]+]] = load i32, i32* %flags
Scott Linderf8b3df42018-08-07 15:52:49 +0000112 // CHECK-LIFETIMES: [[LIFETIME_PTR:%[0-9]+]] = bitcast [1 x i64]* %[[BLOCK_SIZES1]] to i8*
113 // CHECK-LIFETIMES-NEXT: call void @llvm.lifetime.start.p0i8(i64 8, i8* nonnull [[LIFETIME_PTR]])
114 // CHECK-LIFETIMES-NEXT: getelementptr inbounds [1 x i64], [1 x i64]* %[[BLOCK_SIZES1]], i64 0, i64 0
115 // CHECK-LIFETIMES-LABEL: call i32 @__enqueue_kernel_varargs(
116 // CHECK-LIFETIMES-NEXT: call void @llvm.lifetime.end.p0i8(i64 8, i8* nonnull [[LIFETIME_PTR]])
117 // B32: %[[TMP:.*]] = getelementptr [1 x i32], [1 x i32]* %[[BLOCK_SIZES1]], i32 0, i32 0
118 // B32: store i32 256, i32* %[[TMP]], align 4
119 // B64: %[[TMP:.*]] = getelementptr [1 x i64], [1 x i64]* %[[BLOCK_SIZES1]], i32 0, i32 0
120 // B64: store i64 256, i64* %[[TMP]], align 8
Yaxun Liu3cab24a2018-05-09 17:07:06 +0000121 // COMMON-LABEL: call i32 @__enqueue_kernel_varargs(
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000122 // COMMON-SAME: %opencl.queue_t{{.*}}* [[DEF_Q]], i32 [[FLAGS]], %struct.ndrange_t* [[NDR]]{{([0-9]+)?}},
123 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8* bitcast ({{.*}} [[INVGK1:[^ ]+_kernel]] to i8*) to i8 addrspace(4)*),
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000124 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8 addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BLG1]] to i8 addrspace(1)*) to i8 addrspace(4)*), i32 1,
Scott Linderf8b3df42018-08-07 15:52:49 +0000125 // B32-SAME: i32* %[[TMP]])
126 // B64-SAME: i64* %[[TMP]])
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +0000127 enqueue_kernel(default_queue, flags, ndrange,
128 ^(local void *p) {
129 return;
130 },
131 256);
Scott Linderf8b3df42018-08-07 15:52:49 +0000132
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +0000133 char c;
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000134 // Emits global block literal [[BLG2]] and block kernel [[INVGK2]].
Anastasia Stulova0df4ac32016-11-14 17:39:58 +0000135 // COMMON: [[DEF_Q:%[0-9]+]] = load %opencl.queue_t{{.*}}*, %opencl.queue_t{{.*}}** %default_queue
136 // COMMON: [[FLAGS:%[0-9]+]] = load i32, i32* %flags
Scott Linderf8b3df42018-08-07 15:52:49 +0000137 // CHECK-LIFETIMES: [[LIFETIME_PTR:%[0-9]+]] = bitcast [1 x i64]* %[[BLOCK_SIZES2]] to i8*
138 // CHECK-LIFETIMES-NEXT: call void @llvm.lifetime.start.p0i8(i64 8, i8* nonnull [[LIFETIME_PTR]])
139 // CHECK-LIFETIMES-NEXT: getelementptr inbounds [1 x i64], [1 x i64]* %[[BLOCK_SIZES2]], i64 0, i64 0
140 // CHECK-LIFETIMES-LABEL: call i32 @__enqueue_kernel_varargs(
141 // CHECK-LIFETIMES-NEXT: call void @llvm.lifetime.end.p0i8(i64 8, i8* nonnull [[LIFETIME_PTR]])
142 // B32: %[[TMP:.*]] = getelementptr [1 x i32], [1 x i32]* %[[BLOCK_SIZES2]], i32 0, i32 0
143 // B32: store i32 %{{.*}}, i32* %[[TMP]], align 4
144 // B64: %[[TMP:.*]] = getelementptr [1 x i64], [1 x i64]* %[[BLOCK_SIZES2]], i32 0, i32 0
145 // B64: store i64 %{{.*}}, i64* %[[TMP]], align 8
Yaxun Liu3cab24a2018-05-09 17:07:06 +0000146 // COMMON-LABEL: call i32 @__enqueue_kernel_varargs(
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000147 // COMMON-SAME: %opencl.queue_t{{.*}}* [[DEF_Q]], i32 [[FLAGS]], %struct.ndrange_t* [[NDR]]{{([0-9]+)?}},
148 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8* bitcast ({{.*}} [[INVGK2:[^ ]+_kernel]] to i8*) to i8 addrspace(4)*),
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000149 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8 addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BLG2]] to i8 addrspace(1)*) to i8 addrspace(4)*), i32 1,
Scott Linderf8b3df42018-08-07 15:52:49 +0000150 // B32-SAME: i32* %[[TMP]])
151 // B64-SAME: i64* %[[TMP]])
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +0000152 enqueue_kernel(default_queue, flags, ndrange,
153 ^(local void *p) {
154 return;
155 },
156 c);
157
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000158 // Emits global block literal [[BLG3]] and block kernel [[INVGK3]].
Anastasia Stulova0df4ac32016-11-14 17:39:58 +0000159 // COMMON: [[DEF_Q:%[0-9]+]] = load %opencl.queue_t{{.*}}*, %opencl.queue_t{{.*}}** %default_queue
160 // COMMON: [[FLAGS:%[0-9]+]] = load i32, i32* %flags
Anastasia Stulova0df4ac32016-11-14 17:39:58 +0000161 // COMMON: [[AD:%arraydecay[0-9]*]] = getelementptr inbounds [1 x %opencl.clk_event_t*], [1 x %opencl.clk_event_t*]* %event_wait_list2, i32 0, i32 0
162 // COMMON: [[WAIT_EVNT:%[0-9]+]] = addrspacecast %opencl.clk_event_t{{.*}}** [[AD]] to %opencl.clk_event_t{{.*}}* addrspace(4)*
163 // COMMON: [[EVNT:%[0-9]+]] = addrspacecast %opencl.clk_event_t{{.*}}** %clk_event to %opencl.clk_event_t{{.*}}* addrspace(4)*
Scott Linderf8b3df42018-08-07 15:52:49 +0000164 // CHECK-LIFETIMES: [[LIFETIME_PTR:%[0-9]+]] = bitcast [1 x i64]* %[[BLOCK_SIZES3]] to i8*
165 // CHECK-LIFETIMES-NEXT: call void @llvm.lifetime.start.p0i8(i64 8, i8* nonnull [[LIFETIME_PTR]])
166 // CHECK-LIFETIMES-NEXT: getelementptr inbounds [1 x i64], [1 x i64]* %[[BLOCK_SIZES3]], i64 0, i64 0
167 // CHECK-LIFETIMES-LABEL: call i32 @__enqueue_kernel_events_varargs(
168 // CHECK-LIFETIMES-NEXT: call void @llvm.lifetime.end.p0i8(i64 8, i8* nonnull [[LIFETIME_PTR]])
169 // B32: %[[TMP:.*]] = getelementptr [1 x i32], [1 x i32]* %[[BLOCK_SIZES3]], i32 0, i32 0
170 // B32: store i32 256, i32* %[[TMP]], align 4
171 // B64: %[[TMP:.*]] = getelementptr [1 x i64], [1 x i64]* %[[BLOCK_SIZES3]], i32 0, i32 0
172 // B64: store i64 256, i64* %[[TMP]], align 8
Yaxun Liu3cab24a2018-05-09 17:07:06 +0000173 // COMMON-LABEL: call i32 @__enqueue_kernel_events_varargs
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000174 // COMMON-SAME: (%opencl.queue_t{{.*}}* [[DEF_Q]], i32 [[FLAGS]], %struct.ndrange_t* {{.*}}, i32 2, %opencl.clk_event_t{{.*}} [[WAIT_EVNT]], %opencl.clk_event_t{{.*}} [[EVNT]],
175 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8* bitcast ({{.*}} [[INVGK3:[^ ]+_kernel]] to i8*) to i8 addrspace(4)*),
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000176 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8 addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BLG3]] to i8 addrspace(1)*) to i8 addrspace(4)*), i32 1,
Scott Linderf8b3df42018-08-07 15:52:49 +0000177 // B32-SAME: i32* %[[TMP]])
178 // B64-SAME: i64* %[[TMP]])
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +0000179 enqueue_kernel(default_queue, flags, ndrange, 2, event_wait_list2, &clk_event,
180 ^(local void *p) {
181 return;
182 },
183 256);
184
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000185 // Emits global block literal [[BLG4]] and block kernel [[INVGK4]].
Anastasia Stulova0df4ac32016-11-14 17:39:58 +0000186 // COMMON: [[DEF_Q:%[0-9]+]] = load %opencl.queue_t{{.*}}*, %opencl.queue_t{{.*}}** %default_queue
187 // COMMON: [[FLAGS:%[0-9]+]] = load i32, i32* %flags
Anastasia Stulova0df4ac32016-11-14 17:39:58 +0000188 // COMMON: [[AD:%arraydecay[0-9]*]] = getelementptr inbounds [1 x %opencl.clk_event_t*], [1 x %opencl.clk_event_t*]* %event_wait_list2, i32 0, i32 0
189 // COMMON: [[WAIT_EVNT:%[0-9]+]] = addrspacecast %opencl.clk_event_t{{.*}}** [[AD]] to %opencl.clk_event_t{{.*}}* addrspace(4)*
190 // COMMON: [[EVNT:%[0-9]+]] = addrspacecast %opencl.clk_event_t{{.*}}** %clk_event to %opencl.clk_event_t{{.*}}* addrspace(4)*
Scott Linderf8b3df42018-08-07 15:52:49 +0000191 // CHECK-LIFETIMES: [[LIFETIME_PTR:%[0-9]+]] = bitcast [1 x i64]* %[[BLOCK_SIZES4]] to i8*
192 // CHECK-LIFETIMES-NEXT: call void @llvm.lifetime.start.p0i8(i64 8, i8* nonnull [[LIFETIME_PTR]])
193 // CHECK-LIFETIMES-NEXT: getelementptr inbounds [1 x i64], [1 x i64]* %[[BLOCK_SIZES4]], i64 0, i64 0
194 // CHECK-LIFETIMES-LABEL: call i32 @__enqueue_kernel_events_varargs(
195 // CHECK-LIFETIMES-NEXT: call void @llvm.lifetime.end.p0i8(i64 8, i8* nonnull [[LIFETIME_PTR]])
196 // B32: %[[TMP:.*]] = getelementptr [1 x i32], [1 x i32]* %[[BLOCK_SIZES4]], i32 0, i32 0
197 // B32: store i32 %{{.*}}, i32* %[[TMP]], align 4
198 // B64: %[[TMP:.*]] = getelementptr [1 x i64], [1 x i64]* %[[BLOCK_SIZES4]], i32 0, i32 0
199 // B64: store i64 %{{.*}}, i64* %[[TMP]], align 8
Yaxun Liu3cab24a2018-05-09 17:07:06 +0000200 // COMMON-LABEL: call i32 @__enqueue_kernel_events_varargs
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000201 // COMMON-SAME: (%opencl.queue_t{{.*}}* [[DEF_Q]], i32 [[FLAGS]], %struct.ndrange_t* {{.*}}, i32 2, %opencl.clk_event_t{{.*}}* addrspace(4)* [[WAIT_EVNT]], %opencl.clk_event_t{{.*}}* addrspace(4)* [[EVNT]],
202 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8* bitcast ({{.*}} [[INVGK4:[^ ]+_kernel]] to i8*) to i8 addrspace(4)*),
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000203 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8 addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BLG4]] to i8 addrspace(1)*) to i8 addrspace(4)*), i32 1,
Scott Linderf8b3df42018-08-07 15:52:49 +0000204 // B32-SAME: i32* %[[TMP]])
205 // B64-SAME: i64* %[[TMP]])
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +0000206 enqueue_kernel(default_queue, flags, ndrange, 2, event_wait_list2, &clk_event,
207 ^(local void *p) {
208 return;
209 },
210 c);
211
Anastasia Stulova0df4ac32016-11-14 17:39:58 +0000212 long l;
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000213 // Emits global block literal [[BLG5]] and block kernel [[INVGK5]].
Anastasia Stulova0df4ac32016-11-14 17:39:58 +0000214 // COMMON: [[DEF_Q:%[0-9]+]] = load %opencl.queue_t{{.*}}*, %opencl.queue_t{{.*}}** %default_queue
215 // COMMON: [[FLAGS:%[0-9]+]] = load i32, i32* %flags
Scott Linderf8b3df42018-08-07 15:52:49 +0000216 // CHECK-LIFETIMES: [[LIFETIME_PTR:%[0-9]+]] = bitcast [1 x i64]* %[[BLOCK_SIZES5]] to i8*
217 // CHECK-LIFETIMES-NEXT: call void @llvm.lifetime.start.p0i8(i64 8, i8* nonnull [[LIFETIME_PTR]])
218 // CHECK-LIFETIMES-NEXT: getelementptr inbounds [1 x i64], [1 x i64]* %[[BLOCK_SIZES5]], i64 0, i64 0
219 // CHECK-LIFETIMES-LABEL: call i32 @__enqueue_kernel_varargs(
220 // CHECK-LIFETIMES-NEXT: call void @llvm.lifetime.end.p0i8(i64 8, i8* nonnull [[LIFETIME_PTR]])
221 // B32: %[[TMP:.*]] = getelementptr [1 x i32], [1 x i32]* %[[BLOCK_SIZES5]], i32 0, i32 0
222 // B32: store i32 %{{.*}}, i32* %[[TMP]], align 4
223 // B64: %[[TMP:.*]] = getelementptr [1 x i64], [1 x i64]* %[[BLOCK_SIZES5]], i32 0, i32 0
224 // B64: store i64 %{{.*}}, i64* %[[TMP]], align 8
Yaxun Liu3cab24a2018-05-09 17:07:06 +0000225 // COMMON-LABEL: call i32 @__enqueue_kernel_varargs
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000226 // COMMON-SAME: (%opencl.queue_t{{.*}}* [[DEF_Q]], i32 [[FLAGS]], %struct.ndrange_t* [[NDR]]{{([0-9]+)?}},
227 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8* bitcast ({{.*}} [[INVGK5:[^ ]+_kernel]] to i8*) to i8 addrspace(4)*),
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000228 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8 addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BLG5]] to i8 addrspace(1)*) to i8 addrspace(4)*), i32 1,
Scott Linderf8b3df42018-08-07 15:52:49 +0000229 // B32-SAME: i32* %[[TMP]])
230 // B64-SAME: i64* %[[TMP]])
Anastasia Stulova0df4ac32016-11-14 17:39:58 +0000231 enqueue_kernel(default_queue, flags, ndrange,
232 ^(local void *p) {
233 return;
234 },
235 l);
236
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000237 // Emits global block literal [[BLG6]] and block kernel [[INVGK6]].
Yaxun Liu29a5ee32017-09-03 13:52:24 +0000238 // COMMON: [[DEF_Q:%[0-9]+]] = load %opencl.queue_t{{.*}}*, %opencl.queue_t{{.*}}** %default_queue
239 // COMMON: [[FLAGS:%[0-9]+]] = load i32, i32* %flags
Scott Linderf8b3df42018-08-07 15:52:49 +0000240 // CHECK-LIFETIMES: [[LIFETIME_PTR:%[0-9]+]] = bitcast [3 x i64]* %[[BLOCK_SIZES6]] to i8*
241 // CHECK-LIFETIMES-NEXT: call void @llvm.lifetime.start.p0i8(i64 24, i8* nonnull [[LIFETIME_PTR]])
242 // CHECK-LIFETIMES-NEXT: getelementptr inbounds [3 x i64], [3 x i64]* %[[BLOCK_SIZES6]], i64 0, i64 0
243 // CHECK-LIFETIMES-LABEL: call i32 @__enqueue_kernel_varargs(
244 // CHECK-LIFETIMES-NEXT: call void @llvm.lifetime.end.p0i8(i64 24, i8* nonnull [[LIFETIME_PTR]])
245 // B32: %[[TMP:.*]] = getelementptr [3 x i32], [3 x i32]* %[[BLOCK_SIZES6]], i32 0, i32 0
246 // B32: store i32 1, i32* %[[TMP]], align 4
247 // B32: %[[BLOCK_SIZES62:.*]] = getelementptr [3 x i32], [3 x i32]* %[[BLOCK_SIZES6]], i32 0, i32 1
248 // B32: store i32 2, i32* %[[BLOCK_SIZES62]], align 4
249 // B32: %[[BLOCK_SIZES63:.*]] = getelementptr [3 x i32], [3 x i32]* %[[BLOCK_SIZES6]], i32 0, i32 2
250 // B32: store i32 4, i32* %[[BLOCK_SIZES63]], align 4
251 // B64: %[[TMP:.*]] = getelementptr [3 x i64], [3 x i64]* %[[BLOCK_SIZES6]], i32 0, i32 0
252 // B64: store i64 1, i64* %[[TMP]], align 8
253 // B64: %[[BLOCK_SIZES62:.*]] = getelementptr [3 x i64], [3 x i64]* %[[BLOCK_SIZES6]], i32 0, i32 1
254 // B64: store i64 2, i64* %[[BLOCK_SIZES62]], align 8
255 // B64: %[[BLOCK_SIZES63:.*]] = getelementptr [3 x i64], [3 x i64]* %[[BLOCK_SIZES6]], i32 0, i32 2
256 // B64: store i64 4, i64* %[[BLOCK_SIZES63]], align 8
Yaxun Liu3cab24a2018-05-09 17:07:06 +0000257 // COMMON-LABEL: call i32 @__enqueue_kernel_varargs
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000258 // COMMON-SAME: (%opencl.queue_t{{.*}}* [[DEF_Q]], i32 [[FLAGS]], %struct.ndrange_t* [[NDR]]{{([0-9]+)?}},
259 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8* bitcast ({{.*}} [[INVGK6:[^ ]+_kernel]] to i8*) to i8 addrspace(4)*),
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000260 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8 addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BLG6]] to i8 addrspace(1)*) to i8 addrspace(4)*), i32 3,
Scott Linderf8b3df42018-08-07 15:52:49 +0000261 // B32-SAME: i32* %[[TMP]])
262 // B64-SAME: i64* %[[TMP]])
Yaxun Liu29a5ee32017-09-03 13:52:24 +0000263 enqueue_kernel(default_queue, flags, ndrange,
264 ^(local void *p1, local void *p2, local void *p3) {
265 return;
266 },
267 1, 2, 4);
268
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000269 // Emits global block literal [[BLG7]] and block kernel [[INVGK7]].
Anastasia Stulova0df4ac32016-11-14 17:39:58 +0000270 // COMMON: [[DEF_Q:%[0-9]+]] = load %opencl.queue_t*, %opencl.queue_t** %default_queue
271 // COMMON: [[FLAGS:%[0-9]+]] = load i32, i32* %flags
Scott Linderf8b3df42018-08-07 15:52:49 +0000272 // CHECK-LIFETIMES: [[LIFETIME_PTR:%[0-9]+]] = bitcast [1 x i64]* %[[BLOCK_SIZES7]] to i8*
273 // CHECK-LIFETIMES-NEXT: call void @llvm.lifetime.start.p0i8(i64 8, i8* nonnull [[LIFETIME_PTR]])
274 // CHECK-LIFETIMES-NEXT: getelementptr inbounds [1 x i64], [1 x i64]* %[[BLOCK_SIZES7]], i64 0, i64 0
275 // CHECK-LIFETIMES-LABEL: call i32 @__enqueue_kernel_varargs(
276 // CHECK-LIFETIMES-NEXT: call void @llvm.lifetime.end.p0i8(i64 8, i8* nonnull [[LIFETIME_PTR]])
277 // B32: %[[TMP:.*]] = getelementptr [1 x i32], [1 x i32]* %[[BLOCK_SIZES7]], i32 0, i32 0
278 // B32: store i32 0, i32* %[[TMP]], align 4
279 // B64: %[[TMP:.*]] = getelementptr [1 x i64], [1 x i64]* %[[BLOCK_SIZES7]], i32 0, i32 0
280 // B64: store i64 4294967296, i64* %[[TMP]], align 8
Yaxun Liu3cab24a2018-05-09 17:07:06 +0000281 // COMMON-LABEL: call i32 @__enqueue_kernel_varargs
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000282 // COMMON-SAME: (%opencl.queue_t{{.*}}* [[DEF_Q]], i32 [[FLAGS]], %struct.ndrange_t* [[NDR]]{{([0-9]+)?}},
283 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8* bitcast ({{.*}} [[INVGK7:[^ ]+_kernel]] to i8*) to i8 addrspace(4)*),
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000284 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8 addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BLG7]] to i8 addrspace(1)*) to i8 addrspace(4)*), i32 1,
Scott Linderf8b3df42018-08-07 15:52:49 +0000285 // B32-SAME: i32* %[[TMP]])
286 // B64-SAME: i64* %[[TMP]])
Anastasia Stulova0df4ac32016-11-14 17:39:58 +0000287 enqueue_kernel(default_queue, flags, ndrange,
288 ^(local void *p) {
289 return;
290 },
291 4294967296L);
292
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000293 // Emits global block literal [[BLG8]] and invoke function [[INVG8]].
George Burgess IVe3763372016-12-22 02:50:20 +0000294 // The full type of these expressions are long (and repeated elsewhere), so we
295 // capture it as part of the regex for convenience and clarity.
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000296 // COMMON: store void () addrspace(4)* addrspacecast (void () addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BLG8]] to void () addrspace(1)*) to void () addrspace(4)*), void () addrspace(4)** %block_A
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +0000297 void (^const block_A)(void) = ^{
298 return;
299 };
George Burgess IVe3763372016-12-22 02:50:20 +0000300
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000301 // Emits global block literal [[BLG9]] and invoke function [[INVG9]].
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000302 // COMMON: store void (i8 addrspace(3)*) addrspace(4)* addrspacecast (void (i8 addrspace(3)*) addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BLG9]] to void (i8 addrspace(3)*) addrspace(1)*) to void (i8 addrspace(3)*) addrspace(4)*), void (i8 addrspace(3)*) addrspace(4)** %block_B
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +0000303 void (^const block_B)(local void *) = ^(local void *a) {
304 return;
305 };
306
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000307 // Uses global block literal [[BLG8]] and invoke function [[INVG8]].
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000308 // COMMON: [[r1:%.*]] = load i8 addrspace(4)*, i8 addrspace(4)* addrspace(4)* getelementptr inbounds (%struct.__opencl_block_literal_generic, %struct.__opencl_block_literal_generic addrspace(4)* addrspacecast (%struct.__opencl_block_literal_generic addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BLG8]] to %struct.__opencl_block_literal_generic addrspace(1)*) to %struct.__opencl_block_literal_generic addrspace(4)*), i32 0, i32 2)
309 // COMMON: [[r2:%.*]] = addrspacecast i8 addrspace(4)* [[r1]] to void (i8 addrspace(4)*)*
310 // COMMON: call spir_func void [[r2]](i8 addrspace(4)* addrspacecast (i8 addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BLG8]] to i8 addrspace(1)*) to i8 addrspace(4)*))
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000311 block_A();
312
313 // Emits global block literal [[BLG8]] and block kernel [[INVGK8]]. [[INVGK8]] calls [[INVG8]].
314 // COMMON: [[DEF_Q:%[0-9]+]] = load %opencl.queue_t{{.*}}*, %opencl.queue_t{{.*}}** %default_queue
315 // COMMON: [[FLAGS:%[0-9]+]] = load i32, i32* %flags
316 // COMMON-LABEL: call i32 @__enqueue_kernel_basic(
317 // COMMON-SAME: %opencl.queue_t{{.*}}* [[DEF_Q]], i32 [[FLAGS]], %struct.ndrange_t* byval [[NDR]]{{([0-9]+)?}},
318 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8* bitcast ({{.*}} [[INVGK8:[^ ]+_kernel]] to i8*) to i8 addrspace(4)*),
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000319 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8 addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BLG8]] to i8 addrspace(1)*) to i8 addrspace(4)*))
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000320 enqueue_kernel(default_queue, flags, ndrange, block_A);
321
322 // Uses block kernel [[INVGK8]] and global block literal [[BLG8]].
323 // COMMON: call i32 @__get_kernel_work_group_size_impl(
324 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8* bitcast ({{.*}} [[INVGK8]] to i8*) to i8 addrspace(4)*),
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000325 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8 addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BLG8]] to i8 addrspace(1)*) to i8 addrspace(4)*))
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +0000326 unsigned size = get_kernel_work_group_size(block_A);
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000327
328 // Uses global block literal [[BLG8]] and invoke function [[INVG8]]. Make sure no redundant block literal and invoke functions are emitted.
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000329 // COMMON: [[r1:%.*]] = load i8 addrspace(4)*, i8 addrspace(4)* addrspace(4)* getelementptr inbounds (%struct.__opencl_block_literal_generic, %struct.__opencl_block_literal_generic addrspace(4)* addrspacecast (%struct.__opencl_block_literal_generic addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BLG8]] to %struct.__opencl_block_literal_generic addrspace(1)*) to %struct.__opencl_block_literal_generic addrspace(4)*), i32 0, i32 2)
330 // COMMON: [[r2:%.*]] = addrspacecast i8 addrspace(4)* [[r1]] to void (i8 addrspace(4)*)*
331 // COMMON: call spir_func void [[r2]](i8 addrspace(4)* addrspacecast (i8 addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BLG8]] to i8 addrspace(1)*) to i8 addrspace(4)*))
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000332 block_A();
333
Yaxun Liufa13d012018-02-15 16:39:19 +0000334 void (^block_C)(void) = ^{
335 callee(i, a);
336 };
337
338 // Emits block literal on stack and block kernel [[INVLK3]].
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000339 // COMMON: store i8 addrspace(4)* addrspacecast (i8* bitcast (void (i8 addrspace(4)*)* [[INVL3:@__device_side_enqueue_block_invoke[^ ]*]] to i8*) to i8 addrspace(4)*), i8 addrspace(4)** %block.invoke
Yaxun Liufa13d012018-02-15 16:39:19 +0000340 // COMMON: [[DEF_Q:%[0-9]+]] = load %opencl.queue_t{{.*}}*, %opencl.queue_t{{.*}}** %default_queue
341 // COMMON: [[FLAGS:%[0-9]+]] = load i32, i32* %flags
342 // COMMON: [[BL_I8:%[0-9]+]] = addrspacecast void ()* {{.*}} to i8 addrspace(4)*
343 // COMMON-LABEL: call i32 @__enqueue_kernel_basic(
344 // COMMON-SAME: %opencl.queue_t{{.*}}* [[DEF_Q]], i32 [[FLAGS]], %struct.ndrange_t* byval [[NDR]]{{([0-9]+)?}},
345 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8* bitcast ({{.*}} [[INVLK3:[^ ]+_kernel]] to i8*) to i8 addrspace(4)*),
346 // COMMON-SAME: i8 addrspace(4)* [[BL_I8]])
347 enqueue_kernel(default_queue, flags, ndrange, block_C);
348
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000349 // Emits global block literal [[BLG9]] and block kernel [[INVGK9]]. [[INVGK9]] calls [[INV9]].
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000350 // COMMON: call i32 @__get_kernel_work_group_size_impl(
351 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8* bitcast ({{.*}} [[INVGK9:[^ ]+_kernel]] to i8*) to i8 addrspace(4)*),
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000352 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8 addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BLG9]] to i8 addrspace(1)*) to i8 addrspace(4)*))
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +0000353 size = get_kernel_work_group_size(block_B);
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000354
355 // Uses global block literal [[BLG8]] and block kernel [[INVGK8]]. Make sure no redundant block literal ind invoke functions are emitted.
Yaxun Liu3cab24a2018-05-09 17:07:06 +0000356 // COMMON: call i32 @__get_kernel_preferred_work_group_size_multiple_impl(
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000357 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8* bitcast ({{.*}} [[INVGK8]] to i8*) to i8 addrspace(4)*),
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000358 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8 addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BLG8]] to i8 addrspace(1)*) to i8 addrspace(4)*))
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +0000359 size = get_kernel_preferred_work_group_size_multiple(block_A);
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000360
361 // Uses global block literal [[BL_GLOBAL]] and block kernel [[INV_G_K]]. [[INV_G_K]] calls [[INV_G]].
Yaxun Liu3cab24a2018-05-09 17:07:06 +0000362 // COMMON: call i32 @__get_kernel_preferred_work_group_size_multiple_impl(
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000363 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8* bitcast ({{.*}} [[INV_G_K:[^ ]+_kernel]] to i8*) to i8 addrspace(4)*),
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000364 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8 addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BL_GLOBAL]] to i8 addrspace(1)*) to i8 addrspace(4)*))
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +0000365 size = get_kernel_preferred_work_group_size_multiple(block_G);
Joey Goulyfa76b492017-08-01 13:27:09 +0000366
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000367 // Emits global block literal [[BLG10]] and block kernel [[INVGK10]].
368 // COMMON: call i32 @__get_kernel_max_sub_group_size_for_ndrange_impl(%struct.ndrange_t* {{[^,]+}},
369 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8* bitcast ({{.*}} [[INVGK10:[^ ]+_kernel]] to i8*) to i8 addrspace(4)*),
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000370 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8 addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BLG10]] to i8 addrspace(1)*) to i8 addrspace(4)*))
Joey Goulyfa76b492017-08-01 13:27:09 +0000371 size = get_kernel_max_sub_group_size_for_ndrange(ndrange, ^(){});
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000372
373 // Emits global block literal [[BLG11]] and block kernel [[INVGK11]].
374 // COMMON: call i32 @__get_kernel_sub_group_count_for_ndrange_impl(%struct.ndrange_t* {{[^,]+}},
375 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8* bitcast ({{.*}} [[INVGK11:[^ ]+_kernel]] to i8*) to i8 addrspace(4)*),
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000376 // COMMON-SAME: i8 addrspace(4)* addrspacecast (i8 addrspace(1)* bitcast ({ i32, i32, i8 addrspace(4)* } addrspace(1)* [[BLG11]] to i8 addrspace(1)*) to i8 addrspace(4)*))
Joey Goulyfa76b492017-08-01 13:27:09 +0000377 size = get_kernel_sub_group_count_for_ndrange(ndrange, ^(){});
Anastasia Stulovadb7a31c2016-07-05 11:31:24 +0000378}
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000379
380// COMMON: define internal spir_kernel void [[INVLK1]](i8 addrspace(4)*) #{{[0-9]+}} {
381// COMMON: entry:
382// COMMON: call void @__device_side_enqueue_block_invoke(i8 addrspace(4)* %0)
383// COMMON: ret void
384// COMMON: }
385// COMMON: define internal spir_kernel void [[INVLK2]](i8 addrspace(4)*{{.*}})
386// COMMON: define internal spir_kernel void [[INVGK1]](i8 addrspace(4)*{{.*}}, i8 addrspace(3)*{{.*}})
387// COMMON: define internal spir_kernel void [[INVGK2]](i8 addrspace(4)*{{.*}}, i8 addrspace(3)*{{.*}})
388// COMMON: define internal spir_kernel void [[INVGK3]](i8 addrspace(4)*{{.*}}, i8 addrspace(3)*{{.*}})
389// COMMON: define internal spir_kernel void [[INVGK4]](i8 addrspace(4)*{{.*}}, i8 addrspace(3)*{{.*}})
390// COMMON: define internal spir_kernel void [[INVGK5]](i8 addrspace(4)*{{.*}}, i8 addrspace(3)*{{.*}})
391// COMMON: define internal spir_kernel void [[INVGK6]](i8 addrspace(4)*, i8 addrspace(3)*, i8 addrspace(3)*, i8 addrspace(3)*) #{{[0-9]+}} {
392// COMMON: entry:
393// COMMON: call void @__device_side_enqueue_block_invoke_8(i8 addrspace(4)* %0, i8 addrspace(3)* %1, i8 addrspace(3)* %2, i8 addrspace(3)* %3)
394// COMMON: ret void
395// COMMON: }
396// COMMON: define internal spir_kernel void [[INVGK7]](i8 addrspace(4)*{{.*}}, i8 addrspace(3)*{{.*}})
397// COMMON: define internal spir_func void [[INVG8]](i8 addrspace(4)*{{.*}})
Sven van Haastregtda3b6322018-10-02 13:02:24 +0000398// COMMON: define internal spir_func void [[INVG9]](i8 addrspace(4)*{{.*}}, i8 addrspace(3)* %{{.*}})
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000399// COMMON: define internal spir_kernel void [[INVGK8]](i8 addrspace(4)*{{.*}})
Yaxun Liufa13d012018-02-15 16:39:19 +0000400// COMMON: define internal spir_kernel void [[INVLK3]](i8 addrspace(4)*{{.*}})
Yaxun Liuc2a87a02017-10-14 12:23:50 +0000401// COMMON: define internal spir_kernel void [[INVGK9]](i8 addrspace(4)*{{.*}}, i8 addrspace(3)*{{.*}})
402// COMMON: define internal spir_kernel void [[INV_G_K]](i8 addrspace(4)*{{.*}}, i8 addrspace(3)*{{.*}})
403// COMMON: define internal spir_kernel void [[INVGK10]](i8 addrspace(4)*{{.*}})
404// COMMON: define internal spir_kernel void [[INVGK11]](i8 addrspace(4)*{{.*}})