// RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp -fopenmp-version=45 -x c++ -emit-llvm %s -o - -femit-all-decls | FileCheck %s --check-prefix CHECK --check-prefix OMP45
// RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
// RUN: %clang_cc1 -fopenmp -fopenmp-version=45 -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - -femit-all-decls | FileCheck %s --check-prefix CHECK --check-prefix OMP45
// RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp -fopenmp-version=50 -x c++ -emit-llvm %s -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP50
// RUN: %clang_cc1 -fopenmp -fopenmp-version=50 -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
// RUN: %clang_cc1 -fopenmp -fopenmp-version=50 -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s --check-prefix CHECK --check-prefix OMP50

// RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp-simd -fopenmp-version=45 -x c++ -emit-llvm %s -o - -femit-all-decls | FileCheck --check-prefix SIMD-ONLY0 %s
// RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
// RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=45 -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - -femit-all-decls | FileCheck --check-prefix SIMD-ONLY0 %s
// RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp-simd -fopenmp-version=50 -x c++ -emit-llvm %s -o - -femit-all-decls | FileCheck --check-prefix SIMD-ONLY0 %s
// RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=50 -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
// RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=50 -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - -femit-all-decls | FileCheck --check-prefix SIMD-ONLY0 %s
// SIMD-ONLY0-NOT: {{__kmpc|__tgt}}
// expected-no-diagnostics

// LLVM IR generation test for '#pragma omp taskloop simd'.
//
// The invocations above compile this file for OpenMP 4.5 and OpenMP 5.0, each
// one directly and again through a PCH round trip (-emit-pch, then
// -include-pch of the result while compiling this same file). The HEADER
// guard below presumably keeps that second pass from seeing every definition
// twice. The -fopenmp-simd invocations only require that the output contains
// no __kmpc or __tgt references.
#ifndef HEADER
#define HEADER

// CHECK-LABEL: @main
int main(int argc, char **argv) {
// Loop 1: 'priority' clause. The runtime calls must be wrapped in a
// taskgroup/end_taskgroup pair, the task is allocated with flags value 33
// (presumably tied | priority; confirm against the runtime flag definitions),
// and the bounds 0..9 with stride 1 are stored before the taskloop call.
// CHECK: [[GTID:%.+]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* [[DEFLOC:@.+]])
// CHECK: call void @__kmpc_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
// CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 33, i64 80, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK1:@.+]] to i32 (i32, i8*)*))
// CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
// CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
// CHECK: store i64 0, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
// CHECK: store i64 9, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
// CHECK: store i64 1, i64* [[ST]],
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 0, i64 0, i8* null)
// CHECK: call void @__kmpc_end_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
#pragma omp taskloop simd priority(argc)
  for (int i = 0; i < 10; ++i)
    ;
// Loop 2: 'nogroup grainsize(argc) simdlen(4)'. The grainsize value is
// zero-extended to i64 and passed as the last integer argument of the
// taskloop call, preceded by 'i32 1'.
// CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 80, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK2:@.+]] to i32 (i32, i8*)*))
// CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
// CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
// CHECK: store i64 0, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
// CHECK: store i64 9, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
// CHECK: store i64 1, i64* [[ST]],
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[GRAINSIZE:%.+]] = zext i32 %{{.+}} to i64
// CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 1, i64 [[GRAINSIZE]], i8* null)
#pragma omp taskloop simd nogroup grainsize(argc) simdlen(4)
  for (int i = 0; i < 10; ++i)
    ;
// Loop 3: 'if', 'shared', 'collapse(2)', 'num_tasks(4)', 'safelen(32)'.
// The two OpenMP versions differ in the second size argument of the task
// allocation (16 vs. 24) and in how the 'if' condition is produced (a direct
// integer compare vs. a reloaded i8 truncated to i1). The constant num_tasks
// value 4 is passed after 'i32 2'.
// CHECK: call void @__kmpc_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
// OMP45: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 80, i64 16, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK3:@.+]] to i32 (i32, i8*)*))
// OMP50: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 80, i64 24, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK3:@.+]] to i32 (i32, i8*)*))
// CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
// CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
// OMP45: [[IF:%.+]] = icmp ne i32 %{{.+}}, 0
// OMP50: [[IF_VAL:%.+]] = load i8, i8* %
// OMP50: [[IF:%.+]] = trunc i8 [[IF_VAL]] to i1
// CHECK: [[IF_INT:%.+]] = sext i1 [[IF]] to i32
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
// CHECK: store i64 0, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
// CHECK: store i64 %{{.+}}, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
// CHECK: store i64 1, i64* [[ST]],
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 [[IF_INT]], i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 2, i64 4, i8* null)
// CHECK: call void @__kmpc_end_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  int i;
#pragma omp taskloop simd if(argc) shared(argc, argv) collapse(2) num_tasks(4) safelen(32)
  for (i = 0; i < argc; ++i)
    for (int j = argc; j < argv[argc][argc]; ++j)
      ;
}

// Outlined task entry for loop 1: bounds, stride and last-iteration flag are
// read from fields 5..8 of the task data, and the loop's memory accesses must
// carry !llvm.access.group metadata.
// CHECK: define internal i32 [[TASK1]](
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
// CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
// CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
// CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
// CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
// CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
// CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
// CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
// CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
// CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
// CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
// CHECK: br label
// CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],{{.*}}!llvm.access.group
// CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
// CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],{{.*}}!llvm.access.group
// CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
// CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
// CHECK: load i32, i32* %{{.*}}!llvm.access.group
// CHECK: store i32 %{{.*}}!llvm.access.group
// CHECK: load i32, i32* %{{.*}}!llvm.access.group
// CHECK: add nsw i32 %{{.+}}, 1
// CHECK: store i32 %{{.+}}, i32* %{{.*}}!llvm.access.group
// CHECK: br label %{{.*}}!llvm.loop
// CHECK: ret i32 0

// Outlined task entry for loop 2: same shape as loop 1, again with
// !llvm.access.group on the loop's memory accesses.
// CHECK: define internal i32 [[TASK2]](
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
// CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
// CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
// CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
// CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
// CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
// CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
// CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
// CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
// CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
// CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
// CHECK: br label
// CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],{{.*}}!llvm.access.group
// CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
// CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],{{.*}}!llvm.access.group
// CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
// CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
// CHECK: load i32, i32* %{{.*}}!llvm.access.group
// CHECK: store i32 %{{.*}}!llvm.access.group
// CHECK: load i32, i32* %{{.*}}!llvm.access.group
// CHECK: add nsw i32 %{{.+}}, 1
// CHECK: store i32 %{{.+}}, i32* %{{.*}}!llvm.access.group
// CHECK: br label %{{.*}}!llvm.loop
// CHECK: ret i32 0

// Outlined task entry for loop 3 (the one with 'safelen'): the lower bound is
// kept as i64 for the collapsed counter, and no !llvm.access.group may appear
// before the loop back-edge.
// CHECK: define internal i32 [[TASK3]](
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
// CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
// CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
// CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
// CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
// CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
// CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
// CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
// CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
// CHECK: store i64 [[LB_VAL]], i64* [[CNT:%.+]],
// CHECK: br label
// CHECK-NOT: !llvm.access.group
// CHECK: br label %{{.*}}!llvm.loop
// CHECK: ret i32 0

// Loop 4 lives in a constructor and iterates over the data member 'a', which
// is also the 'num_tasks' argument. The num_tasks value is zero-extended to
// i64 and passed after 'i32 2'.
// CHECK-LABEL: @_ZN1SC2Ei
struct S {
  int a;
  S(int c) {
// CHECK: [[GTID:%.+]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* [[DEFLOC:@.+]])
// CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 80, i64 16, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK4:@.+]] to i32 (i32, i8*)*))
// CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
// CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
// CHECK: store i64 0, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
// CHECK: store i64 %{{.+}}, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
// CHECK: store i64 1, i64* [[ST]],
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[NUM_TASKS:%.+]] = zext i32 %{{.+}} to i64
// CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 2, i64 [[NUM_TASKS]], i8* null)
#pragma omp taskloop simd shared(c) num_tasks(a) simdlen(8) safelen(64)
    for (a = 0; a < c; ++a)
      ;
  }
} s(1);

// Outlined task entry for loop 4 ('simdlen' together with 'safelen'): the
// loop's loads and stores must not carry !llvm.access.group metadata.
// CHECK: define internal i32 [[TASK4]](
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
// CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
// CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
// CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
// CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
// CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
// CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
// CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
// CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
// CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
// CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
// CHECK: br label
// CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
// CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
// CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
// CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
// CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
// CHECK: load i32, i32* %
// CHECK-NOT: !llvm.access.group
// CHECK: store i32 %
// CHECK-NOT: !llvm.access.group
// CHECK: load i32, i32* %
// CHECK-NOT: !llvm.access.group
// CHECK: add nsw i32 %{{.+}}, 1
// CHECK: store i32 %{{.+}}, i32* %
// CHECK-NOT: !llvm.access.group
// CHECK: br label %{{.*}}!llvm.loop
// CHECK: ret i32 0

// Loop metadata: the vectorize widths 4, 32 and 8 line up, in order, with
// simdlen(4) on loop 2, safelen(32) on loop 3 and simdlen(8) on loop 4.
// CHECK: !{!"llvm.loop.vectorize.enable", i1 true}
// CHECK: !{!"llvm.loop.vectorize.width", i32 4}
// CHECK: !{!"llvm.loop.vectorize.width", i32 32}
// CHECK: !{!"llvm.loop.vectorize.width", i32 8}

#endif