// RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp -fopenmp-version=50 -x c++ -emit-llvm %s -o - | FileCheck %s
// RUN: %clang_cc1 -fopenmp -fopenmp-version=50 -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
// RUN: %clang_cc1 -fopenmp -fopenmp-version=50 -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - | FileCheck %s

// RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp-simd -fopenmp-version=50 -x c++ -emit-llvm %s -o - | FileCheck --check-prefix SIMD-ONLY0 %s
// RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=50 -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
// RUN: %clang_cc1 -fopenmp-simd -fopenmp-version=50 -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - | FileCheck --check-prefix SIMD-ONLY0 %s
// SIMD-ONLY0-NOT: {{__kmpc|__tgt}}
// expected-no-diagnostics

// Code generation test for '#pragma omp taskloop' in OpenMP 5.0 mode.
// Each pragma below is paired with the IR patterns that must appear in the
// enclosing function, and each outlined task entry point captured there
// (TASK1..TASK4, TASK_CANCEL) is matched again further down. The test is run
// both directly and through a precompiled header, which is why the whole body
// sits inside the HEADER include guard.
#ifndef HEADER
#define HEADER

// CHECK-LABEL: @main
int main(int argc, char **argv) {
// Plain task: only the allocation and the task launch are matched.
// CHECK: [[GTID:%.+]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* [[DEFLOC:@.+]])
// CHECK: call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]],
// CHECK: call i32 @__kmpc_omp_task(%struct.ident_t* [[DEFLOC]], i32 [[GTID]],
#pragma omp task
  ;
// taskloop with a priority clause: the region is bracketed by taskgroup calls,
// the task is allocated with flags 33 (the other regions here use 1), and the
// bounds 0..9 with stride 1 are stored into fields 5, 6 and 7 of the task data.
// CHECK: call void @__kmpc_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
// CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 33, i64 80, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK1:@.+]] to i32 (i32, i8*)*))
// CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
// CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
// CHECK: store i64 0, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
// CHECK: store i64 9, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
// CHECK: store i64 1, i64* [[ST]],
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 0, i64 0, i8* null)
// CHECK: call void @__kmpc_end_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
#pragma omp taskloop priority(argc)
  for (int i = 0; i < 10; ++i)
    ;
// taskloop with nogroup and grainsize: no taskgroup calls are matched for this
// region, and the zero-extended grainsize value is passed to the runtime with
// schedule kind 1.
// CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 80, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK2:@.+]] to i32 (i32, i8*)*))
// CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
// CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
// CHECK: store i64 0, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
// CHECK: store i64 9, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
// CHECK: store i64 1, i64* [[ST]],
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[GRAINSIZE:%.+]] = zext i32 %{{.+}} to i64
// CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 1, i64 [[GRAINSIZE]], i8* null)
#pragma omp taskloop nogroup grainsize(argc)
  for (int i = 0; i < 10; ++i)
    ;
// taskloop with if, shared, collapse(2) and num_tasks(4): the if condition is
// computed and forwarded to the runtime, the upper bound is a runtime value,
// and the constant 4 is passed with schedule kind 2.
// CHECK: call void @__kmpc_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
// CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 80, i64 16, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK3:@.+]] to i32 (i32, i8*)*))
// CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
// CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
// CHECK: [[IF:%.+]] = icmp ne i32 %{{.+}}, 0
// CHECK: [[IF_INT:%.+]] = sext i1 [[IF]] to i32
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
// CHECK: store i64 0, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
// CHECK: store i64 %{{.+}}, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
// CHECK: store i64 1, i64* [[ST]],
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 [[IF_INT]], i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 2, i64 4, i8* null)
// CHECK: call void @__kmpc_end_taskgroup(%struct.ident_t* [[DEFLOC]], i32 [[GTID]])
  int i;
#pragma omp taskloop if(argc) shared(argc, argv) collapse(2) num_tasks(4)
  for (i = 0; i < argc; ++i)
    for (int j = argc; j < argv[argc][argc]; ++j)
      ;
// taskloop whose body contains cancel and cancellation point directives; the
// body of the outlined task is verified under TASK_CANCEL below.
// CHECK: call void @__kmpc_taskgroup(
// CHECK: call i8* @__kmpc_omp_task_alloc(%struct.ident_t* @{{.+}}, i32 %{{.+}}, i32 1, i64 80, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, %{{.+}}*)* [[TASK_CANCEL:@.+]] to i32 (i32, i8*)*))
// CHECK: call void @__kmpc_taskloop(
// CHECK: call void @__kmpc_end_taskgroup(
#pragma omp taskloop
  for (int i = 0; i < 10; ++i) {
#pragma omp cancel taskgroup
#pragma omp cancellation point taskgroup
  }
}

// Outlined body of the priority(argc) loop: lower bound, upper bound, stride
// and last-iteration flag are loaded from fields 5..8 of the task data, then
// the 32-bit counter is iterated up to the upper bound.
// CHECK: define internal i32 [[TASK1]](
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
// CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
// CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
// CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
// CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
// CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
// CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
// CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
// CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
// CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
// CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
// CHECK: br label
// CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
// CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
// CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
// CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
// CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
// CHECK: load i32, i32* %
// CHECK: store i32 %
// CHECK: load i32, i32* %
// CHECK: add nsw i32 %{{.+}}, 1
// CHECK: store i32 %{{.+}}, i32* %
// CHECK: br label %
// CHECK: ret i32 0

// Outlined body of the nogroup grainsize(argc) loop; same shape as TASK1.
// CHECK: define internal i32 [[TASK2]](
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
// CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
// CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
// CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
// CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
// CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
// CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
// CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
// CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
// CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
// CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
// CHECK: br label
// CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
// CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
// CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
// CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
// CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
// CHECK: load i32, i32* %
// CHECK: store i32 %
// CHECK: load i32, i32* %
// CHECK: add nsw i32 %{{.+}}, 1
// CHECK: store i32 %{{.+}}, i32* %
// CHECK: br label %
// CHECK: ret i32 0

// Outlined body of the collapse(2) loop: here the lower bound is stored into a
// 64-bit counter without truncation.
// CHECK: define internal i32 [[TASK3]](
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
// CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
// CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
// CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
// CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
// CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
// CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
// CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
// CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
// CHECK: store i64 [[LB_VAL]], i64* [[CNT:%.+]],
// CHECK: br label
// CHECK: ret i32 0

// Outlined body of the loop containing cancel / cancellation point: each
// runtime call's result is compared against zero and, when non-zero, control
// branches to an exit block that stores 1 into the cleanup slot.
// CHECK: define internal i32 [[TASK_CANCEL]](
// CHECK: [[RES:%.+]] = call i32 @__kmpc_cancel(%struct.ident_t* @{{.+}}, i32 %{{.+}}, i32 4)
// CHECK: [[IS_CANCEL:%.+]] = icmp ne i32 [[RES]], 0
// CHECK: br i1 [[IS_CANCEL]], label %[[EXIT:.+]], label %[[CONTINUE:[^,]+]]
// CHECK: [[EXIT]]:
// CHECK: store i32 1, i32* [[CLEANUP_SLOT:%.+]],
// CHECK: br label %[[DONE:[^,]+]]
// CHECK: [[CONTINUE]]:
// CHECK: [[RES:%.+]] = call i32 @__kmpc_cancellationpoint(%struct.ident_t* @{{.+}}, i32 %{{.+}}, i32 4)
// CHECK: [[IS_CANCEL:%.+]] = icmp ne i32 [[RES]], 0
// CHECK: br i1 [[IS_CANCEL]], label %[[EXIT2:.+]], label %[[CONTINUE2:[^,]+]]
// CHECK: [[EXIT2]]:
// CHECK: store i32 1, i32* [[CLEANUP_SLOT]],
// CHECK: br label %[[DONE]]
// CHECK: store i32 0, i32* [[CLEANUP_SLOT]],
// CHECK: br label %[[DONE]]
// CHECK: [[DONE]]:
// CHECK: ret i32 0

// taskloop inside a constructor: the data member 'a' is both the loop counter
// and the num_tasks expression, so the task count is a zero-extended runtime
// value passed with schedule kind 2.
// CHECK-LABEL: @_ZN1SC2Ei
struct S {
  int a;
  S(int c) {
// CHECK: [[GTID:%.+]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* [[DEFLOC:@.+]])
// CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 80, i64 16, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK4:@.+]] to i32 (i32, i8*)*))
// CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
// CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
// CHECK: store i64 0, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
// CHECK: store i64 %{{.+}}, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
// CHECK: store i64 1, i64* [[ST]],
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[NUM_TASKS:%.+]] = zext i32 %{{.+}} to i64
// CHECK: call void @__kmpc_taskloop(%struct.ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 1, i32 2, i64 [[NUM_TASKS]], i8* null)
#pragma omp taskloop shared(c) num_tasks(a)
    for (a = 0; a < c; ++a)
      ;
  }
} s(1);

// Outlined body of the constructor's loop; same shape as TASK1.
// CHECK: define internal i32 [[TASK4]](
// CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
// CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
// CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
// CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
// CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
// CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
// CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
// CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
// CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
// CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
// CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
// CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
// CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
// CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
// CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
// CHECK: br label
// CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
// CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
// CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
// CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
// CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
// CHECK: load i32, i32* %
// CHECK: store i32 %
// CHECK: load i32, i32* %
// CHECK: add nsw i32 %{{.+}}, 1
// CHECK: store i32 %{{.+}}, i32* %
// CHECK: br label %
// CHECK: ret i32 0

// Class type used as a taskloop iteration variable below: it only declares a
// conversion to int and a compound-addition operator.
class St {
public:
  operator int();
  St &operator+=(int);
};

// taskloop over a class-typed iteration variable: a larger task allocation
// (88 bytes) is matched, and the last argument of the taskloop runtime call is
// a function pointer instead of the null used by the other loops in this file.
// CHECK-LABEL: taskloop_with_class
void taskloop_with_class() {
  St s1;
  // CHECK: [[TD:%.+]] = call i8* @__kmpc_omp_task_alloc(%struct.ident_t* @{{.+}}, i32 [[GTID:%.+]], i32 1, i64 88, i64 8, i32 (i32, i8*)* bitcast (i32 (i32, [[TD_TYPE:%.+]]*)* @{{.+}} to i32 (i32, i8*)*))
  // CHECK: call void @__kmpc_taskloop(%struct.ident_t* @{{.+}}, i32 [[GTID]], i8* [[TD]], i32 1, i64* %{{.+}}, i64* %{{.+}}, i64 %{{.+}}, i32 1, i32 0, i64 0, i8* bitcast (void ([[TD_TYPE]]*, [[TD_TYPE]]*, i32)* @{{.+}} to i8*))
#pragma omp taskloop
  for (St s = St(); s < s1; s += 1) {
  }
}

#endif