// xref: /llvm-project/openmp/runtime/test/ompt/parallel/nested_lwt_thread_num.c (revision f41d08540be21f852b7ee6293953f66f5a1123b6)
// RUN: %libomp-compile-and-run | FileCheck %s
// REQUIRES: ompt
3*f41d0854SVladimir Inđić 
4*f41d0854SVladimir Inđić #include "callback.h"
5*f41d0854SVladimir Inđić #include <omp.h>
6*f41d0854SVladimir Inđić 
7*f41d0854SVladimir Inđić 
8*f41d0854SVladimir Inđić __attribute__ ((noinline)) // workaround for bug in icc
print_task_info_at(int ancestor_level,int id)9*f41d0854SVladimir Inđić void print_task_info_at(int ancestor_level, int id)
10*f41d0854SVladimir Inđić {
11*f41d0854SVladimir Inđić #pragma omp critical
12*f41d0854SVladimir Inđić   {
13*f41d0854SVladimir Inđić     int task_type;
14*f41d0854SVladimir Inđić     char buffer[2048];
15*f41d0854SVladimir Inđić     ompt_data_t *parallel_data;
16*f41d0854SVladimir Inđić     ompt_data_t *task_data;
17*f41d0854SVladimir Inđić     int thread_num;
18*f41d0854SVladimir Inđić     ompt_get_task_info(ancestor_level, &task_type, &task_data, NULL,
19*f41d0854SVladimir Inđić                        &parallel_data, &thread_num);
20*f41d0854SVladimir Inđić     format_task_type(task_type, buffer);
21*f41d0854SVladimir Inđić     printf("%" PRIu64 ": ancestor_level=%d id=%d task_type=%s=%d "
22*f41d0854SVladimir Inđić                       "parallel_id=%" PRIu64 " task_id=%" PRIu64
23*f41d0854SVladimir Inđić                       " thread_num=%d\n",
24*f41d0854SVladimir Inđić         ompt_get_thread_data()->value, ancestor_level, id, buffer,
25*f41d0854SVladimir Inđić         task_type, parallel_data->value, task_data->value, thread_num);
26*f41d0854SVladimir Inđić   }
27*f41d0854SVladimir Inđić };
28*f41d0854SVladimir Inđić 
// Convenience wrapper: print the task info for ancestor level 0 (the
// innermost level), tagged with `id`.
__attribute__ ((noinline)) // workaround for bug in icc
void print_innermost_task_info(int id)
{
  const int innermost_level = 0;

  print_task_info_at(innermost_level, id);
}
34*f41d0854SVladimir Inđić 
35*f41d0854SVladimir Inđić 
// Test driver. Thread 1 of a two-thread parallel region (region 0) enters two
// nested num_threads(1) parallel regions (regions 1 and 2) and prints the
// task info reported at each nesting level. The FileCheck directives placed
// after the parallel region pin the expected output: thread_num is 1 for the
// task in region 0 and 0 for the tasks in regions 1 and 2.
int main()
{

#pragma omp parallel num_threads(2)
  {
    // sync threads before checking the output
#pragma omp barrier
    // region 0
    if (omp_get_thread_num() == 1) {
      // executed by worker thread only
      // assert that thread_num is 1
      print_innermost_task_info(1);

#pragma omp parallel num_threads(1)
      {
        // serialized region 1
        // assert that thread_num is 0
        print_innermost_task_info(2);

#pragma omp parallel num_threads(1)
        {
          // serialized region 2
          // assert that thread_num is 0
          print_innermost_task_info(3);

          // Check the value of thread_num while iterating over the hierarchy
          // of active tasks: level 0 is the task of region 2, level 1 the
          // task of region 1 and level 2 the task of region 0. The second
          // argument repeats the id printed earlier from inside that region.
          print_task_info_at(0, 3);
          print_task_info_at(1, 2);
          print_task_info_at(2, 1);

        }

      }
    }
  }


  // Check if libomp supports the callbacks for this test.
  // CHECK-NOT: {{^}}0: Could not register callback 'ompt_callback_task_create'
  // CHECK-NOT: {{^}}0: Could not register callback 'ompt_callback_implicit_task'


  // CHECK: {{^}}0: NULL_POINTER=[[NULL:.*$]]
  // CHECK: {{^}}[[MASTER_ID:[0-9]+]]: ompt_event_initial_task_begin: parallel_id=[[PARALLEL_ID_0:[0-9]+]], task_id=[[TASK_ID_0:[0-9]+]], actual_parallelism=1, index=1, flags=1

  // region 0
  // CHECK: {{^}}[[MASTER_ID]]: ompt_event_parallel_begin: parent_task_id=[[TASK_ID_0]],
  // CHECK-SAME: parallel_id=[[PARALLEL_ID_1:[0-9]+]]
  // CHECK-DAG: {{^}}[[MASTER_ID]]: ompt_event_implicit_task_begin: parallel_id=[[PARALLEL_ID_1]], task_id=[[TASK_ID_1:[0-9]+]]
  // CHECK-DAG: {{^}}[[WORKER_ID:[0-9]+]]: ompt_event_implicit_task_begin: parallel_id=[[PARALLEL_ID_1]], task_id=[[TASK_ID_2:[0-9]+]]
  // Assert some info about the implicit task executed by the worker thread;
  // thread_num is the most important part.
  // CHECK: {{^}}[[WORKER_ID]]: ancestor_level=0 id=1
  // CHECK-SAME: parallel_id=[[PARALLEL_ID_1]] task_id=[[TASK_ID_2]]
  // CHECK-SAME: thread_num=1

  // serialized region 1
  // CHECK: {{^}}[[WORKER_ID]]: ompt_event_parallel_begin: parent_task_id=[[TASK_ID_2]],
  // CHECK-SAME: parallel_id=[[PARALLEL_ID_2:[0-9]+]]
  // CHECK-DAG: {{^}}[[WORKER_ID]]: ompt_event_implicit_task_begin: parallel_id=[[PARALLEL_ID_2]], task_id=[[TASK_ID_3:[0-9]+]]
  // Assert some information about the implicit task of serialized region 1;
  // note that thread_num must be 0 here.
  // CHECK: {{^}}[[WORKER_ID]]: ancestor_level=0 id=2
  // CHECK-SAME: parallel_id=[[PARALLEL_ID_2]] task_id=[[TASK_ID_3]]
  // CHECK-SAME: thread_num=0

  // serialized region 2
  // CHECK: {{^}}[[WORKER_ID]]: ompt_event_parallel_begin: parent_task_id=[[TASK_ID_3]],
  // CHECK-SAME: parallel_id=[[PARALLEL_ID_3:[0-9]+]]
  // CHECK-DAG: {{^}}[[WORKER_ID]]: ompt_event_implicit_task_begin: parallel_id=[[PARALLEL_ID_3]], task_id=[[TASK_ID_4:[0-9]+]]
  // Assert some information about the implicit task of serialized region 2;
  // note that thread_num must be 0 here.
  // CHECK: {{^}}[[WORKER_ID]]: ancestor_level=0 id=3
  // CHECK-SAME: parallel_id=[[PARALLEL_ID_3]] task_id=[[TASK_ID_4]]
  // CHECK-SAME: thread_num=0

  // Check the value of the thread_num argument while iterating over the
  // hierarchy of active tasks. thread_num is expected to take the values
  // verified above (0, 0, 1, respectively).

  // Thread is the master thread of the region 2, so thread_num should be 0.
  // CHECK: {{^}}[[WORKER_ID]]: ancestor_level=0 id=3
  // CHECK-SAME: parallel_id=[[PARALLEL_ID_3]] task_id=[[TASK_ID_4]]
  // CHECK-SAME: thread_num=0

  // Thread is the master thread of the region 1, so thread_num should be 0.
  // CHECK: {{^}}[[WORKER_ID]]: ancestor_level=1 id=2
  // CHECK-SAME: parallel_id=[[PARALLEL_ID_2]] task_id=[[TASK_ID_3]]
  // CHECK-SAME: thread_num=0

  // Thread is the worker thread of the region 0, so thread_num should be 1.
  // CHECK: {{^}}[[WORKER_ID]]: ancestor_level=2 id=1
  // CHECK-SAME: parallel_id=[[PARALLEL_ID_1]] task_id=[[TASK_ID_2]]
  // CHECK-SAME: thread_num=1

  return 0;
}
134