xref: /llvm-project/clang/test/OpenMP/taskloop_codegen.cpp (revision 7a2037151c2976b5ca6677a559fc3777066e746a)
1 // RUN: %clang_cc1 -verify -triple x86_64-apple-darwin10 -fopenmp -x c++ -emit-llvm %s -o - -femit-all-decls | FileCheck %s
2 // RUN: %clang_cc1 -fopenmp -x c++ -triple x86_64-apple-darwin10 -emit-pch -o %t %s
3 // RUN: %clang_cc1 -fopenmp -x c++ -triple x86_64-apple-darwin10 -include-pch %t -verify %s -emit-llvm -o - -femit-all-decls | FileCheck %s
4 // expected-no-diagnostics
5 #ifndef HEADER
6 #define HEADER
7 
8 // CHECK-LABEL: @main
// Codegen driver holding three `#pragma omp taskloop` loops. The FileCheck
// directives placed ahead of each pragma describe the IR that must appear in
// @main for that loop: a __kmpc_omp_task_alloc call, stores into fields 5, 6
// and 7 of the task data (captured by the patterns as DOWN, UP and ST), and a
// closing __kmpc_taskloop call. The outlined task entries captured here as
// TASK1, TASK2 and TASK3 are matched by separate directive groups that follow
// this function.
9 int main(int argc, char **argv) {
// Loop 1: priority(argc). The allocation pattern requires a flags operand of
// 33 (the other two loops use 1), constant bounds 0 and 9, stride 1, and the
// trailing runtime-call operands `i32 0, i32 0, i64 0`.
// NOTE(review): 33 is presumably the priority bit (32) combined with the tied
// bit (1) -- confirm against the OpenMP runtime's task flag layout.
10 // CHECK: [[GTID:%.+]] = call i32 @__kmpc_global_thread_num(%ident_t* [[DEFLOC:@.+]])
11 // CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%ident_t* [[DEFLOC]], i32 [[GTID]], i32 33, i64 72, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK1:@.+]] to i32 (i32, i8*)*))
12 // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
13 // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
14 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
15 // CHECK: store i64 0, i64* [[DOWN]],
16 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
17 // CHECK: store i64 9, i64* [[UP]],
18 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
19 // CHECK: store i64 1, i64* [[ST]],
20 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
21 // CHECK: call void @__kmpc_taskloop(%ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 0, i32 0, i64 0, i8* null)
22 #pragma omp taskloop priority(argc)
23   for (int i = 0; i < 10; ++i)
24     ;
// Loop 2: nogroup grainsize(argc). Same constant bounds and stride as loop 1,
// flags operand 1. A value zero-extended from i32 to i64 is captured as
// GRAINSIZE and must be passed to the runtime call right after `i32 1, i32 1`.
// NOTE(review): those two i32 operands are presumably the runtime's nogroup
// and schedule-kind arguments (1 = grainsize) -- confirm against the
// __kmpc_taskloop interface.
25 // CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 72, i64 1, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK2:@.+]] to i32 (i32, i8*)*))
26 // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
27 // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
28 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
29 // CHECK: store i64 0, i64* [[DOWN]],
30 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
31 // CHECK: store i64 9, i64* [[UP]],
32 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
33 // CHECK: store i64 1, i64* [[ST]],
34 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
35 // CHECK: [[GRAINSIZE:%.+]] = zext i32 %{{.+}} to i64
36 // CHECK: call void @__kmpc_taskloop(%ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 0, i32 1, i64 [[GRAINSIZE]], i8* null)
37 #pragma omp taskloop nogroup grainsize(argc)
38   for (int i = 0; i < 10; ++i)
39     ;
// Loop 3: if(argc) shared(argc, argv) collapse(2) num_tasks(4). The patterns
// require:
//   - an allocation whose operand after `i64 72` is 24 (1 in the loops above);
//     NOTE(review): presumably the size of the shared-variables block -- confirm.
//   - an `icmp ne ..., 0` result sign-extended to i32, captured as IF_INT and
//     passed where the earlier runtime calls pass the constant `i32 1`.
//   - a non-constant upper bound stored to UP (lower bound 0, stride 1).
//   - trailing runtime-call operands `i32 0, i32 2, i64 4`; NOTE(review):
//     presumably schedule kind 2 = num_tasks with the literal 4 from the
//     clause -- confirm against the __kmpc_taskloop interface.
40 // CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 72, i64 24, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK3:@.+]] to i32 (i32, i8*)*))
41 // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
42 // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
43 // CHECK: [[IF:%.+]] = icmp ne i32 %{{.+}}, 0
44 // CHECK: [[IF_INT:%.+]] = sext i1 [[IF]] to i32
45 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
46 // CHECK: store i64 0, i64* [[DOWN]],
47 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
48 // CHECK: store i64 %{{.+}}, i64* [[UP]],
49 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
50 // CHECK: store i64 1, i64* [[ST]],
51 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
52 // CHECK: call void @__kmpc_taskloop(%ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 [[IF_INT]], i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 0, i32 2, i64 4, i8* null)
// `i` is declared outside the directive and then used as the iteration
// variable of the outer collapsed loop; `j` is declared in the inner loop.
53   int i;
54 #pragma omp taskloop if(argc) shared(argc, argv) collapse(2) num_tasks(4)
55   for (i = 0; i < argc; ++i)
// The inner bound reads argv[argc][argc]. The lit invocations at the top of
// the file only emit IR or a PCH, so this expression is compiled, not run.
56   for (int j = argc; j < argv[argc][argc]; ++j)
57     ;
58 }
59 
60 // CHECK: define internal i32 [[TASK1]](
61 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
62 // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
63 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
64 // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
65 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
66 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
67 // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
68 // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
69 // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
70 // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
71 // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
72 // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
73 // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
74 // CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
75 // CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
76 // CHECK: br label
77 // CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
78 // CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
79 // CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
80 // CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
81 // CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
82 // CHECK: load i32, i32* %
83 // CHECK: store i32 %
84 // CHECK: load i32, i32* %
85 // CHECK: add nsw i32 %{{.+}}, 1
86 // CHECK: store i32 %{{.+}}, i32* %
87 // CHECK: br label %
88 // CHECK: ret i32 0
89 
90 // CHECK: define internal i32 [[TASK2]](
91 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
92 // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
93 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
94 // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
95 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
96 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
97 // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
98 // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
99 // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
100 // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
101 // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
102 // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
103 // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
104 // CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
105 // CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
106 // CHECK: br label
107 // CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
108 // CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
109 // CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
110 // CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
111 // CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
112 // CHECK: load i32, i32* %
113 // CHECK: store i32 %
114 // CHECK: load i32, i32* %
115 // CHECK: add nsw i32 %{{.+}}, 1
116 // CHECK: store i32 %{{.+}}, i32* %
117 // CHECK: br label %
118 // CHECK: ret i32 0
119 
120 // CHECK: define internal i32 [[TASK3]](
121 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
122 // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
123 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
124 // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
125 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
126 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
127 // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
128 // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
129 // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
130 // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
131 // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
132 // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
133 // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
134 // CHECK: store i64 [[LB_VAL]], i64* [[CNT:%.+]],
135 // CHECK: br label
136 // CHECK: ret i32 0
137 
138 // CHECK-LABEL: @_ZN1SC2Ei
// S: a struct whose constructor contains a taskloop that uses the data member
// `a` as its iteration variable, with the parameter `c` shared and `a` also
// supplying the num_tasks value. The global object `s(1)` defined together
// with the struct is the only construction of S visible in this file. The
// outlined task entry captured below as TASK4 is matched by the directive
// group that follows the struct.
139 struct S {
140   int a;
141   S(int c) {
// The patterns require: an allocation with flags operand 1 and 16 as the
// operand after `i64 72`; lower bound 0, a non-constant upper bound, stride 1;
// and a value zero-extended from i32 to i64, captured as NUM_TASKS, passed to
// the runtime call right after `i32 0, i32 2`.
// NOTE(review): the `i32 2` is presumably the runtime's schedule kind for
// num_tasks -- confirm against the __kmpc_taskloop interface.
// NOTE(review): nothing assigns `a` before the num_tasks(a) clause reads it;
// this looks harmless for an IR-only test, but confirm it is intentional.
142 // CHECK: [[GTID:%.+]] = call i32 @__kmpc_global_thread_num(%ident_t* [[DEFLOC:@.+]])
143 // CHECK: [[TASKV:%.+]] = call i8* @__kmpc_omp_task_alloc(%ident_t* [[DEFLOC]], i32 [[GTID]], i32 1, i64 72, i64 16, i32 (i32, i8*)* bitcast (i32 (i32, [[TDP_TY:%.+]]*)* [[TASK4:@.+]] to i32 (i32, i8*)*))
144 // CHECK: [[TASK:%.+]] = bitcast i8* [[TASKV]] to [[TDP_TY]]*
145 // CHECK: [[TASK_DATA:%.+]] = getelementptr inbounds [[TDP_TY]], [[TDP_TY]]* [[TASK]], i32 0, i32 0
146 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 5
147 // CHECK: store i64 0, i64* [[DOWN]],
148 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 6
149 // CHECK: store i64 %{{.+}}, i64* [[UP]],
150 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* [[TASK_DATA]], i32 0, i32 7
151 // CHECK: store i64 1, i64* [[ST]],
152 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
153 // CHECK: [[NUM_TASKS:%.+]] = zext i32 %{{.+}} to i64
154 // CHECK: call void @__kmpc_taskloop(%ident_t* [[DEFLOC]], i32 [[GTID]], i8* [[TASKV]], i32 1, i64* [[DOWN]], i64* [[UP]], i64 [[ST_VAL]], i32 0, i32 2, i64 [[NUM_TASKS]], i8* null)
155 #pragma omp taskloop shared(c) num_tasks(a)
156     for (a = 0; a < c; ++a)
157       ;
158   }
159 } s(1);
160 
161 // CHECK: define internal i32 [[TASK4]](
162 // CHECK: [[DOWN:%.+]] = getelementptr inbounds [[TD_TY:%.+]], [[TD_TY]]* %{{.+}}, i32 0, i32 5
163 // CHECK: [[DOWN_VAL:%.+]] = load i64, i64* [[DOWN]],
164 // CHECK: [[UP:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 6
165 // CHECK: [[UP_VAL:%.+]] = load i64, i64* [[UP]],
166 // CHECK: [[ST:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 7
167 // CHECK: [[ST_VAL:%.+]] = load i64, i64* [[ST]],
168 // CHECK: [[LITER:%.+]] = getelementptr inbounds [[TD_TY]], [[TD_TY]]* %{{.+}}, i32 0, i32 8
169 // CHECK: [[LITER_VAL:%.+]] = load i32, i32* [[LITER]],
170 // CHECK: store i64 [[DOWN_VAL]], i64* [[LB:%[^,]+]],
171 // CHECK: store i64 [[UP_VAL]], i64* [[UB:%[^,]+]],
172 // CHECK: store i64 [[ST_VAL]], i64* [[ST:%[^,]+]],
173 // CHECK: store i32 [[LITER_VAL]], i32* [[LITER:%[^,]+]],
174 // CHECK: [[LB_VAL:%.+]] = load i64, i64* [[LB]],
175 // CHECK: [[LB_I32:%.+]] = trunc i64 [[LB_VAL]] to i32
176 // CHECK: store i32 [[LB_I32]], i32* [[CNT:%.+]],
177 // CHECK: br label
178 // CHECK: [[VAL:%.+]] = load i32, i32* [[CNT]],
179 // CHECK: [[VAL_I64:%.+]] = sext i32 [[VAL]] to i64
180 // CHECK: [[UB_VAL:%.+]] = load i64, i64* [[UB]],
181 // CHECK: [[CMP:%.+]] = icmp ule i64 [[VAL_I64]], [[UB_VAL]]
182 // CHECK: br i1 [[CMP]], label %{{.+}}, label %{{.+}}
183 // CHECK: load i32, i32* %
184 // CHECK: store i32 %
185 // CHECK: load i32, i32* %
186 // CHECK: add nsw i32 %{{.+}}, 1
187 // CHECK: store i32 %{{.+}}, i32* %
188 // CHECK: br label %
189 // CHECK: ret i32 0
190 
191 #endif
192