Samuel Antao | 4be30e9 | 2015-10-02 17:14:03 +0000 | [diff] [blame^] | 1 | // RUN: %clang_cc1 -verify -fopenmp -x c++ -triple powerpc64le-unknown-unknown -emit-llvm %s -o - | FileCheck %s |
| 2 | // RUN: %clang_cc1 -fopenmp -x c++ -std=c++11 -triple powerpc64le-unknown-unknown -emit-pch -o %t %s |
| 3 | // RUN: %clang_cc1 -fopenmp -x c++ -triple powerpc64le-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s |
| 4 | // RUN: %clang_cc1 -verify -fopenmp -x c++ -triple i386-unknown-unknown -emit-llvm %s -o - | FileCheck %s |
| 5 | // RUN: %clang_cc1 -fopenmp -x c++ -std=c++11 -triple i386-unknown-unknown -emit-pch -o %t %s |
| 6 | // RUN: %clang_cc1 -fopenmp -x c++ -triple i386-unknown-unknown -std=c++11 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s |
| 7 | // expected-no-diagnostics |
| 8 | #ifndef HEADER |
| 9 | #define HEADER |
| 10 | |
| 11 | |
| 12 | // CHECK-DAG: [[GA:@.+]] = global double 1.000000e+00 |
| 13 | // CHECK-DAG: [[GB:@.+]] = global double 2.000000e+00 |
| 14 | // CHECK-DAG: [[GC:@.+]] = global double 3.000000e+00 |
| 15 | // CHECK-DAG: [[GD:@.+]] = global double 4.000000e+00 |
| 16 | // CHECK-DAG: [[FA:@.+]] = internal global float 5.000000e+00 |
| 17 | // CHECK-DAG: [[FB:@.+]] = internal global float 6.000000e+00 |
| 18 | // CHECK-DAG: [[FC:@.+]] = internal global float 7.000000e+00 |
| 19 | // CHECK-DAG: [[FD:@.+]] = internal global float 8.000000e+00 |
| 20 | // CHECK-DAG: [[BA:@.+]] = internal global float 9.000000e+00 |
| 21 | // CHECK-DAG: [[BB:@.+]] = internal global float 1.000000e+01 |
| 22 | // CHECK-DAG: [[BC:@.+]] = internal global float 1.100000e+01 |
| 23 | // CHECK-DAG: [[BD:@.+]] = internal global float 1.200000e+01 |
// File-scope doubles used by the OpenMP regions in foo() and bar().
// Ga and Gc are only read in `if` clauses; Gb and Gd are incremented inside
// the regions. The initial values 1.0..4.0 are the constants the
// global-variable patterns earlier in this file match against.
| 24 | double Ga = 1.0; |
| 25 | double Gb = 2.0; |
| 26 | double Gc = 3.0; |
| 27 | double Gd = 4.0; |
| 28 | |
| 29 | // CHECK: define {{.*}} @{{.*}}foo{{.*}}( |
| 30 | // CHECK-SAME: i16 {{[^,]*}}[[A:%[^,]+]], |
| 31 | // CHECK-SAME: i16 {{[^,]*}}[[B:%[^,]+]], |
| 32 | // CHECK-SAME: i16 {{[^,]*}}[[C:%[^,]+]], |
| 33 | // CHECK-SAME: i16 {{[^,]*}}[[D:%[^,]+]]) |
| 34 | // CHECK: [[LA:%.+]] = alloca i16 |
| 35 | // CHECK: [[LB:%.+]] = alloca i16 |
| 36 | // CHECK: [[LC:%.+]] = alloca i16 |
| 37 | // CHECK: [[LD:%.+]] = alloca i16 |
// Test fixture: an `omp target` region (with an `if` clause) that contains a
// nested `omp parallel` region (with its own `if` clause).
//
// Variables come in three flavours so each capture path is exercised:
//   - function parameters (a, b, c, d; type short),
//   - file-scope globals (Ga..Gd; type double),
//   - function-local statics (Sa..Sd; type float, initialised 5.0..8.0).
// The "a" set is read only by the target `if` clause, the "b" set is modified
// in the target region, the "c" set is read only by the parallel `if` clause,
// and the "d" set is modified in the parallel region.
//
// Returns the sum of the four parameters and the four statics (each static
// converted to int).
| 38 | int foo(short a, short b, short c, short d){ |
| 39 | static float Sa = 5.0; |
| 40 | static float Sb = 6.0; |
| 41 | static float Sc = 7.0; |
| 42 | static float Sd = 8.0; |
| 43 | |
| 44 | // CHECK-DAG: [[REFB:%.+]] = bitcast i16* [[LB]] to i8* |
| 45 | // CHECK-DAG: store i8* [[REFB]], i8** [[GEPB:%.+]], align |
| 46 | // CHECK-DAG: [[REFC:%.+]] = bitcast i16* [[LC]] to i8* |
| 47 | // CHECK-DAG: store i8* [[REFC]], i8** [[GEPC:%.+]], align |
| 48 | // CHECK-DAG: [[REFD:%.+]] = bitcast i16* [[LD]] to i8* |
| 49 | // CHECK-DAG: store i8* [[REFD]], i8** [[GEPD:%.+]], align |
| 50 | // CHECK-DAG: store i8* bitcast (double* [[GB]] to i8*), i8** [[GEPGB:%.+]], align |
| 51 | // CHECK-DAG: store i8* bitcast (double* [[GC]] to i8*), i8** [[GEPGC:%.+]], align |
| 52 | // CHECK-DAG: store i8* bitcast (double* [[GD]] to i8*), i8** [[GEPGD:%.+]], align |
| 53 | // CHECK-DAG: store i8* bitcast (float* [[FB]] to i8*), i8** [[GEPFB:%.+]], align |
| 54 | // CHECK-DAG: store i8* bitcast (float* [[FC]] to i8*), i8** [[GEPFC:%.+]], align |
| 55 | // CHECK-DAG: store i8* bitcast (float* [[FD]] to i8*), i8** [[GEPFD:%.+]], align |
| 56 | // CHECK-DAG: [[GEPB]] = getelementptr inbounds [9 x i8*], [9 x i8*]* %{{.+}}, i32 0, i32 {{.+}} |
| 57 | // CHECK-DAG: [[GEPC]] = getelementptr inbounds [9 x i8*], [9 x i8*]* %{{.+}}, i32 0, i32 {{.+}} |
| 58 | // CHECK-DAG: [[GEPD]] = getelementptr inbounds [9 x i8*], [9 x i8*]* %{{.+}}, i32 0, i32 {{.+}} |
| 59 | // CHECK-DAG: [[GEPGB]] = getelementptr inbounds [9 x i8*], [9 x i8*]* %{{.+}}, i32 0, i32 {{.+}} |
| 60 | // CHECK-DAG: [[GEPGC]] = getelementptr inbounds [9 x i8*], [9 x i8*]* %{{.+}}, i32 0, i32 {{.+}} |
| 61 | // CHECK-DAG: [[GEPGD]] = getelementptr inbounds [9 x i8*], [9 x i8*]* %{{.+}}, i32 0, i32 {{.+}} |
| 62 | // CHECK-DAG: [[GEPFB]] = getelementptr inbounds [9 x i8*], [9 x i8*]* %{{.+}}, i32 0, i32 {{.+}} |
| 63 | // CHECK-DAG: [[GEPFC]] = getelementptr inbounds [9 x i8*], [9 x i8*]* %{{.+}}, i32 0, i32 {{.+}} |
| 64 | // CHECK-DAG: [[GEPFD]] = getelementptr inbounds [9 x i8*], [9 x i8*]* %{{.+}}, i32 0, i32 {{.+}} |
| 65 | // CHECK: call i32 @__tgt_target |
| 66 | // CHECK: call void [[OFFLOADF:@.+]]( |
| 67 | // Capture b, Gb, Sb, Gc, c, Sc, d, Gd, Sd |
// The `if` clause operands (Ga, a, Sa) are deliberately absent from the
// capture list above: the patterns expect exactly nine pointers to be passed.
| 68 | #pragma omp target if(Ga>0.0 && a>0 && Sa>0.0) |
| 69 | { |
| 70 | b += 1; |
| 71 | Gb += 1.0; |
| 72 | Sb += 1.0; |
| 73 | |
| 74 | // CHECK: define internal void [[OFFLOADF]]({{.+}}* {{.*}}%{{.+}}, {{.+}}* {{.*}}%{{.+}}, {{.+}}* {{.*}}%{{.+}}, {{.+}}* {{.*}}%{{.+}}, {{.+}}* {{.*}}%{{.+}}, {{.+}}* {{.*}}%{{.+}}, {{.+}}* {{.*}}%{{.+}}, {{.+}}* {{.*}}%{{.+}}, {{.+}}* {{.*}}%{{.+}}) |
| 75 | // The parallel region only uses 3 captures. |
| 76 | // CHECK: call {{.*}}@__kmpc_fork_call(%ident_t* {{.+}}, i32 {{.+}}, void (i32*, i32*, ...)* bitcast ({{.*}}[[PARF:@.+]] to {{.*}}), {{.+}}* %{{.+}}, {{.+}}* %{{.+}}, {{.+}}* %{{.+}}) |
| 77 | // CHECK: call void @.omp_outlined.(i32* %{{.+}}, i32* %{{.+}}, {{.+}}* %{{.+}}, {{.+}}* %{{.+}}, {{.+}}* %{{.+}}) |
| 78 | // Capture d, Gd, Sd |
| 79 | |
| 80 | // CHECK: define internal void [[PARF]](i32* noalias %{{.*}}, i32* noalias %{{.*}}, |
// Nested region: Gc, c and Sc appear only in the `if` clause; d, Gd and Sd
// are the variables modified in the body.
| 81 | #pragma omp parallel if(Gc>0.0 && c>0 && Sc>0.0) |
| 82 | { |
| 83 | d += 1; |
| 84 | Gd += 1.0; |
| 85 | Sd += 1.0; |
| 86 | } |
| 87 | } |
| 88 | return a + b + c + d + (int)Sa + (int)Sb + (int)Sc + (int)Sd; |
| 89 | } |
| 90 | |
| 91 | // CHECK: define {{.*}} @{{.*}}bar{{.*}}( |
| 92 | // CHECK-SAME: i16 {{[^,]*}}[[A:%[^,]+]], |
| 93 | // CHECK-SAME: i16 {{[^,]*}}[[B:%[^,]+]], |
| 94 | // CHECK-SAME: i16 {{[^,]*}}[[C:%[^,]+]], |
| 95 | // CHECK-SAME: i16 {{[^,]*}}[[D:%[^,]+]]) |
| 96 | // CHECK: [[LA:%.+]] = alloca i16 |
| 97 | // CHECK: [[LB:%.+]] = alloca i16 |
| 98 | // CHECK: [[LC:%.+]] = alloca i16 |
| 99 | // CHECK: [[LD:%.+]] = alloca i16 |
// Test fixture: the same target-with-nested-parallel shape as foo(), but the
// `omp target` region is itself wrapped in an outer `omp parallel` region, so
// the target construct sees a, b, c and d through the outer region's captures
// rather than directly as function parameters.
//
// Nesting, outermost first:
//   1. `omp parallel`                      - captures a, b, c, d
//   2. `omp target if(Ga, a, Sa)`          - modifies b, Gb, Sb
//   3. `omp parallel if(Gc, c, Sc)`        - modifies d, Gd, Sd
// The local statics Sa..Sd are initialised 9.0..12.0.
//
// Returns the sum of the four parameters and the four statics (each static
// converted to int).
| 100 | int bar(short a, short b, short c, short d){ |
| 101 | static float Sa = 9.0; |
| 102 | static float Sb = 10.0; |
| 103 | static float Sc = 11.0; |
| 104 | static float Sd = 12.0; |
| 105 | |
| 106 | // CHECK: call void {{.*}}@__kmpc_fork_call(%ident_t* {{.+}}, i32 {{.+}}, void (i32*, i32*, ...)* bitcast ({{.*}}[[PARF:@.+]] to {{.*}}), i16* %{{.+}}, i16* %{{.+}}, i16* %{{.+}}, i16* %{{.+}}) |
| 107 | // CHECK: define internal void [[PARF]](i32* noalias %{{.*}}, i32* noalias %{{.*}}, i16* dereferenceable(2) [[A:%.+]], i16* dereferenceable(2) [[B:%.+]], i16* dereferenceable(2) [[C:%.+]], i16* dereferenceable(2) [[D:%.+]]) |
| 108 | // Capture a, b, c, d |
| 109 | #pragma omp parallel |
| 110 | { |
| 111 | // CHECK: [[ADRA:%.+]] = alloca i16*, align |
| 112 | // CHECK: [[ADRB:%.+]] = alloca i16*, align |
| 113 | // CHECK: [[ADRC:%.+]] = alloca i16*, align |
| 114 | // CHECK: [[ADRD:%.+]] = alloca i16*, align |
| 115 | // CHECK: store i16* [[A]], i16** [[ADRA]], align |
| 116 | // CHECK: store i16* [[B]], i16** [[ADRB]], align |
| 117 | // CHECK: store i16* [[C]], i16** [[ADRC]], align |
| 118 | // CHECK: store i16* [[D]], i16** [[ADRD]], align |
| 119 | // CHECK: [[REFA:%.+]] = load i16*, i16** [[ADRA]], |
| 120 | // CHECK: [[REFB:%.+]] = load i16*, i16** [[ADRB]], |
| 121 | // CHECK: [[REFC:%.+]] = load i16*, i16** [[ADRC]], |
| 122 | // CHECK: [[REFD:%.+]] = load i16*, i16** [[ADRD]], |
| 123 | |
| 124 | // CHECK: load float, float* [[BA]] |
| 125 | |
| 126 | // CHECK-DAG: [[CSTB:%.+]] = bitcast i16* [[REFB]] to i8* |
| 127 | // CHECK-DAG: [[CSTC:%.+]] = bitcast i16* [[REFC]] to i8* |
| 128 | // CHECK-DAG: [[CSTD:%.+]] = bitcast i16* [[REFD]] to i8* |
| 129 | // CHECK-DAG: store i8* [[CSTB]], i8** [[GEPB:%.+]], align |
| 130 | // CHECK-DAG: store i8* [[CSTC]], i8** [[GEPC:%.+]], align |
| 131 | // CHECK-DAG: store i8* [[CSTD]], i8** [[GEPD:%.+]], align |
| 132 | // CHECK-DAG: store i8* bitcast (double* [[GB]] to i8*), i8** [[GEPGB:%.+]], align |
| 133 | // CHECK-DAG: store i8* bitcast (double* [[GC]] to i8*), i8** [[GEPGC:%.+]], align |
| 134 | // CHECK-DAG: store i8* bitcast (double* [[GD]] to i8*), i8** [[GEPGD:%.+]], align |
| 135 | // CHECK-DAG: store i8* bitcast (float* [[BB]] to i8*), i8** [[GEPBB:%.+]], align |
| 136 | // CHECK-DAG: store i8* bitcast (float* [[BC]] to i8*), i8** [[GEPBC:%.+]], align |
| 137 | // CHECK-DAG: store i8* bitcast (float* [[BD]] to i8*), i8** [[GEPBD:%.+]], align |
| 138 | |
| 139 | // CHECK-DAG: [[GEPB]] = getelementptr inbounds [9 x i8*], [9 x i8*]* %{{.+}}, i32 0, i32 {{.+}} |
| 140 | // CHECK-DAG: [[GEPC]] = getelementptr inbounds [9 x i8*], [9 x i8*]* %{{.+}}, i32 0, i32 {{.+}} |
| 141 | // CHECK-DAG: [[GEPD]] = getelementptr inbounds [9 x i8*], [9 x i8*]* %{{.+}}, i32 0, i32 {{.+}} |
| 142 | // CHECK-DAG: [[GEPGB]] = getelementptr inbounds [9 x i8*], [9 x i8*]* %{{.+}}, i32 0, i32 {{.+}} |
| 143 | // CHECK-DAG: [[GEPGC]] = getelementptr inbounds [9 x i8*], [9 x i8*]* %{{.+}}, i32 0, i32 {{.+}} |
| 144 | // CHECK-DAG: [[GEPGD]] = getelementptr inbounds [9 x i8*], [9 x i8*]* %{{.+}}, i32 0, i32 {{.+}} |
| 145 | // CHECK-DAG: [[GEPBB]] = getelementptr inbounds [9 x i8*], [9 x i8*]* %{{.+}}, i32 0, i32 {{.+}} |
| 146 | // CHECK-DAG: [[GEPBC]] = getelementptr inbounds [9 x i8*], [9 x i8*]* %{{.+}}, i32 0, i32 {{.+}} |
| 147 | // CHECK-DAG: [[GEPBD]] = getelementptr inbounds [9 x i8*], [9 x i8*]* %{{.+}}, i32 0, i32 {{.+}} |
| 148 | // CHECK: call i32 @__tgt_target |
| 149 | // CHECK: call void [[OFFLOADF:@.+]]( |
| 150 | // Capture b, Gb, Sb, Gc, c, Sc, d, Gd, Sd |
// Same nine-entry capture list as in foo(); here b, c and d are reached
// through the pointers the outer parallel region received.
| 151 | #pragma omp target if(Ga>0.0 && a>0 && Sa>0.0) |
| 152 | { |
| 153 | b += 1; |
| 154 | Gb += 1.0; |
| 155 | Sb += 1.0; |
| 156 | |
| 157 | // CHECK: define internal void [[OFFLOADF]]({{.+}}* {{.*}}%{{.+}}, {{.+}}* {{.*}}%{{.+}}, {{.+}}* {{.*}}%{{.+}}, {{.+}}* {{.*}}%{{.+}}, {{.+}}* {{.*}}%{{.+}}, {{.+}}* {{.*}}%{{.+}}, {{.+}}* {{.*}}%{{.+}}, {{.+}}* {{.*}}%{{.+}}, {{.+}}* {{.*}}%{{.+}}) |
| 158 | // CHECK: call void {{.*}}@__kmpc_fork_call(%ident_t* {{.+}}, i32 {{.+}}, void (i32*, i32*, ...)* bitcast ({{.*}}[[PARF:@.+]] to {{.*}}) |
| 159 | |
| 160 | // CHECK: define internal void [[PARF]](i32* noalias %{{.*}}, i32* noalias %{{.*}}, {{.+}}* dereferenceable({{.+}}) %{{.+}}, {{.+}}* dereferenceable({{.+}}) %{{.+}}, {{.+}}* dereferenceable({{.+}}) %{{.+}}) |
| 161 | // Capture d, Gd, Sd |
| 162 | #pragma omp parallel if(Gc>0.0 && c>0 && Sc>0.0) |
| 163 | { |
| 164 | d += 1; |
| 165 | Gd += 1.0; |
| 166 | Sd += 1.0; |
| 167 | } |
| 168 | } |
| 169 | } |
| 170 | return a + b + c + d + (int)Sa + (int)Sb + (int)Sc + (int)Sd; |
| 171 | } |
| 172 | |
| 173 | #endif |