// Test target codegen - host bc file has to be created first.
// RUN: %clang_cc1 -verify -fopenmp -x c -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc
// RUN: %clang_cc1 -verify -fopenmp -x c -triple nvptx64-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - | FileCheck %s --check-prefix CHECK --check-prefix CHECK-64
// RUN: %clang_cc1 -verify -fopenmp -x c -triple i386-unknown-unknown -fopenmp-targets=nvptx-nvidia-cuda -emit-llvm-bc %s -o %t-x86-host.bc
// RUN: %clang_cc1 -verify -fopenmp -x c -triple nvptx-unknown-unknown -fopenmp-targets=nvptx-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-x86-host.bc -o - | FileCheck %s --check-prefix CHECK --check-prefix CHECK-32
// expected-no-diagnostics

// The commands above build a host bitcode file first and then feed it to the
// device compilation, once with a 64-bit host/device pair and once with a
// 32-bit pair; only the device IR is piped through FileCheck.

// printf is declared by hand rather than through a header, so the test does
// not depend on any system include directory.
extern int printf(const char *, ...);

// CHECK-DAG: private unnamed_addr constant %struct.ident_t { i32 0, i32 2, i32 2, i32 0, i8* getelementptr inbounds
10
// Check a simple call to printf end-to-end.
//
// The directives below pin down the device IR for a target region that calls
// printf with an int, a long long and a double:
//   * a struct type { i32, i64, double } holds the three variadic arguments;
//   * a buffer of that type is allocated in the entry block of the kernel;
//   * each argument is stored into its own field of the buffer;
//   * the buffer is cast to i8* and passed, together with the format string,
//     to vprintf.
// Returns 0 unconditionally.
// CHECK-DAG: [[SIMPLE_PRINTF_TY:%[a-zA-Z0-9_]+]] = type { i32, i64, double }
int CheckSimple() {
  // CHECK: define {{.*}}void [[T1:@__omp_offloading_.+CheckSimple.+]]_worker()
#pragma omp target
  {
    // Entry point.
    // CHECK: define {{.*}}void [[T1]]()
    // Alloca in entry block.
    // CHECK: [[BUF:%[a-zA-Z0-9_]+]] = alloca [[SIMPLE_PRINTF_TY]]

    // CHECK: {{call|invoke}} void [[T1]]_worker()
    // CHECK: br label {{%?}}[[EXIT:.+]]
    //
    // CHECK-DAG: [[CMTID:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.tid.x()
    // CHECK-DAG: [[CMNTH:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.ntid.x()
    // CHECK-DAG: [[CMWS:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.warpsize()
    // CHECK: [[IS_MASTER:%.+]] = icmp eq i32 [[CMTID]],
    // CHECK: br i1 [[IS_MASTER]], label {{%?}}[[MASTER:.+]], label {{%?}}[[EXIT]]
    //
    // CHECK: [[MASTER]]
    // CHECK-DAG: [[MNTH:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.ntid.x()
    // CHECK-DAG: [[MWS:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.warpsize()
    // CHECK: [[MTMP1:%.+]] = sub nuw i32 [[MNTH]], [[MWS]]
    // CHECK: call void @__kmpc_kernel_init(i32 [[MTMP1]]

    // printf in master-only basic block.
    // CHECK: [[FMT:%[0-9]+]] = load{{.*}}%fmt
    // NOTE(review): the load pattern above matches on the text "%fmt", which
    // presumably comes from the name of this local - do not rename it without
    // updating the pattern.
    const char* fmt = "%d %lld %f";
    // CHECK: [[PTR0:%[0-9]+]] = getelementptr inbounds [[SIMPLE_PRINTF_TY]], [[SIMPLE_PRINTF_TY]]* [[BUF]], i32 0, i32 0
    // CHECK: store i32 1, i32* [[PTR0]], align 4
    // CHECK: [[PTR1:%[0-9]+]] = getelementptr inbounds [[SIMPLE_PRINTF_TY]], [[SIMPLE_PRINTF_TY]]* [[BUF]], i32 0, i32 1
    // CHECK: store i64 2, i64* [[PTR1]], align 8
    // CHECK: [[PTR2:%[0-9]+]] = getelementptr inbounds [[SIMPLE_PRINTF_TY]], [[SIMPLE_PRINTF_TY]]* [[BUF]], i32 0, i32 2

    // CHECK: store double 3.0{{[^,]*}}, double* [[PTR2]], align 8
    // CHECK: [[BUF_CAST:%[0-9]+]] = bitcast [[SIMPLE_PRINTF_TY]]* [[BUF]] to i8*
    // CHECK: [[RET:%[0-9]+]] = call i32 @vprintf(i8* [[FMT]], i8* [[BUF_CAST]])
    printf(fmt, 1, 2ll, 3.0);
  }

  return 0;
}
54
// Check a printf call that has a format string but no variadic arguments.
//
// The kernel prologue is matched the same way as in the other tests in this
// file (worker function, entry point, master-thread branch, kernel init).
// The final directive requires the vprintf call to receive a null i8* as its
// argument buffer and to end the line right after the closing parenthesis.
void CheckNoArgs() {
  // CHECK: define {{.*}}void [[T2:@__omp_offloading_.+CheckNoArgs.+]]_worker()
#pragma omp target
  {
    // Entry point.
    // CHECK: define {{.*}}void [[T2]]()

    // CHECK: {{call|invoke}} void [[T2]]_worker()
    // CHECK: br label {{%?}}[[EXIT:.+]]
    //
    // CHECK-DAG: [[CMTID:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.tid.x()
    // CHECK-DAG: [[CMNTH:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.ntid.x()
    // CHECK-DAG: [[CMWS:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.warpsize()
    // CHECK: [[IS_MASTER:%.+]] = icmp eq i32 [[CMTID]],
    // CHECK: br i1 [[IS_MASTER]], label {{%?}}[[MASTER:.+]], label {{%?}}[[EXIT]]
    //
    // CHECK: [[MASTER]]
    // CHECK-DAG: [[MNTH:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.ntid.x()
    // CHECK-DAG: [[MWS:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.warpsize()
    // CHECK: [[MTMP1:%.+]] = sub nuw i32 [[MNTH]], [[MWS]]
    // CHECK: call void @__kmpc_kernel_init(i32 [[MTMP1]]

    // printf in master-only basic block.
    // CHECK: call i32 @vprintf({{.*}}, i8* null){{$}}
    printf("hello, world!");
  }
}
82
// Check that printf's alloca happens in the entry block, not inside the if
// statement.
//
// The printf call sits under a condition on the global `foo`. The alloca
// directive is placed between the entry-point definition and the call to the
// worker function, so the argument buffer has to be allocated before any of
// the later control flow is emitted.
int foo;
void CheckAllocaIsInEntryBlock() {
  // CHECK: define {{.*}}void [[T3:@__omp_offloading_.+CheckAllocaIsInEntryBlock.+]]_worker()
#pragma omp target
  {
    // Entry point.
    // CHECK: define {{.*}}void [[T3]](
    // Alloca in entry block.
    // CHECK: alloca %printf_args

    // CHECK: {{call|invoke}} void [[T3]]_worker()
    // CHECK: br label {{%?}}[[EXIT:.+]]
    //
    // CHECK-DAG: [[CMTID:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.tid.x()
    // CHECK-DAG: [[CMNTH:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.ntid.x()
    // CHECK-DAG: [[CMWS:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.warpsize()
    // CHECK: [[IS_MASTER:%.+]] = icmp eq i32 [[CMTID]],
    // CHECK: br i1 [[IS_MASTER]], label {{%?}}[[MASTER:.+]], label {{%?}}[[EXIT]]
    //
    // CHECK: [[MASTER]]
    // CHECK-DAG: [[MNTH:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.ntid.x()
    // CHECK-DAG: [[MWS:%.+]] = call i32 @llvm.nvvm.read.ptx.sreg.warpsize()
    // CHECK: [[MTMP1:%.+]] = sub nuw i32 [[MNTH]], [[MWS]]
    // CHECK: call void @__kmpc_kernel_init(i32 [[MTMP1]]

    // The conditional printf whose argument buffer must not be allocated
    // inside this branch.
    if (foo) {
      printf("%d", 42);
    }
  }
}