/*
 * kmp_taskdeps.h
 */

//===----------------------------------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
120b57cec5SDimitry Andric
130b57cec5SDimitry Andric #ifndef KMP_TASKDEPS_H
140b57cec5SDimitry Andric #define KMP_TASKDEPS_H
150b57cec5SDimitry Andric
160b57cec5SDimitry Andric #include "kmp.h"
170b57cec5SDimitry Andric
// Acquire / release the `dn.lock` of dependency node `depnode`, forwarding
// `gtid` to the underlying lock routine.
#define KMP_ACQUIRE_DEPNODE(gtid, depnode)                                     \
  __kmp_acquire_lock(&(depnode)->dn.lock, (gtid))
#define KMP_RELEASE_DEPNODE(gtid, depnode)                                     \
  __kmp_release_lock(&(depnode)->dn.lock, (gtid))
200b57cec5SDimitry Andric
__kmp_node_deref(kmp_info_t * thread,kmp_depnode_t * node)210b57cec5SDimitry Andric static inline void __kmp_node_deref(kmp_info_t *thread, kmp_depnode_t *node) {
220b57cec5SDimitry Andric if (!node)
230b57cec5SDimitry Andric return;
240b57cec5SDimitry Andric
250b57cec5SDimitry Andric kmp_int32 n = KMP_ATOMIC_DEC(&node->dn.nrefs) - 1;
266e75b2fbSDimitry Andric KMP_DEBUG_ASSERT(n >= 0);
270b57cec5SDimitry Andric if (n == 0) {
2881ad6265SDimitry Andric #if USE_ITT_BUILD && USE_ITT_NOTIFY
2981ad6265SDimitry Andric __itt_sync_destroy(node);
3081ad6265SDimitry Andric #endif
310b57cec5SDimitry Andric KMP_ASSERT(node->dn.nrefs == 0);
320b57cec5SDimitry Andric #if USE_FAST_MEMORY
330b57cec5SDimitry Andric __kmp_fast_free(thread, node);
340b57cec5SDimitry Andric #else
350b57cec5SDimitry Andric __kmp_thread_free(thread, node);
360b57cec5SDimitry Andric #endif
370b57cec5SDimitry Andric }
380b57cec5SDimitry Andric }
390b57cec5SDimitry Andric
__kmp_depnode_list_free(kmp_info_t * thread,kmp_depnode_list * list)400b57cec5SDimitry Andric static inline void __kmp_depnode_list_free(kmp_info_t *thread,
410b57cec5SDimitry Andric kmp_depnode_list *list) {
420b57cec5SDimitry Andric kmp_depnode_list *next;
430b57cec5SDimitry Andric
440b57cec5SDimitry Andric for (; list; list = next) {
450b57cec5SDimitry Andric next = list->next;
460b57cec5SDimitry Andric
470b57cec5SDimitry Andric __kmp_node_deref(thread, list->node);
480b57cec5SDimitry Andric #if USE_FAST_MEMORY
490b57cec5SDimitry Andric __kmp_fast_free(thread, list);
500b57cec5SDimitry Andric #else
510b57cec5SDimitry Andric __kmp_thread_free(thread, list);
520b57cec5SDimitry Andric #endif
530b57cec5SDimitry Andric }
540b57cec5SDimitry Andric }
550b57cec5SDimitry Andric
__kmp_dephash_free_entries(kmp_info_t * thread,kmp_dephash_t * h)560b57cec5SDimitry Andric static inline void __kmp_dephash_free_entries(kmp_info_t *thread,
570b57cec5SDimitry Andric kmp_dephash_t *h) {
580b57cec5SDimitry Andric for (size_t i = 0; i < h->size; i++) {
590b57cec5SDimitry Andric if (h->buckets[i]) {
600b57cec5SDimitry Andric kmp_dephash_entry_t *next;
610b57cec5SDimitry Andric for (kmp_dephash_entry_t *entry = h->buckets[i]; entry; entry = next) {
620b57cec5SDimitry Andric next = entry->next_in_bucket;
63fe6060f1SDimitry Andric __kmp_depnode_list_free(thread, entry->last_set);
64fe6060f1SDimitry Andric __kmp_depnode_list_free(thread, entry->prev_set);
650b57cec5SDimitry Andric __kmp_node_deref(thread, entry->last_out);
660b57cec5SDimitry Andric if (entry->mtx_lock) {
670b57cec5SDimitry Andric __kmp_destroy_lock(entry->mtx_lock);
680b57cec5SDimitry Andric __kmp_free(entry->mtx_lock);
690b57cec5SDimitry Andric }
700b57cec5SDimitry Andric #if USE_FAST_MEMORY
710b57cec5SDimitry Andric __kmp_fast_free(thread, entry);
720b57cec5SDimitry Andric #else
730b57cec5SDimitry Andric __kmp_thread_free(thread, entry);
740b57cec5SDimitry Andric #endif
750b57cec5SDimitry Andric }
760b57cec5SDimitry Andric h->buckets[i] = 0;
770b57cec5SDimitry Andric }
780b57cec5SDimitry Andric }
79349cc55cSDimitry Andric __kmp_node_deref(thread, h->last_all);
80349cc55cSDimitry Andric h->last_all = NULL;
810b57cec5SDimitry Andric }
820b57cec5SDimitry Andric
__kmp_dephash_free(kmp_info_t * thread,kmp_dephash_t * h)830b57cec5SDimitry Andric static inline void __kmp_dephash_free(kmp_info_t *thread, kmp_dephash_t *h) {
840b57cec5SDimitry Andric __kmp_dephash_free_entries(thread, h);
850b57cec5SDimitry Andric #if USE_FAST_MEMORY
860b57cec5SDimitry Andric __kmp_fast_free(thread, h);
870b57cec5SDimitry Andric #else
880b57cec5SDimitry Andric __kmp_thread_free(thread, h);
890b57cec5SDimitry Andric #endif
900b57cec5SDimitry Andric }
910b57cec5SDimitry Andric
92fe6060f1SDimitry Andric extern void __kmpc_give_task(kmp_task_t *ptask, kmp_int32 start);
93fe6060f1SDimitry Andric
__kmp_release_deps(kmp_int32 gtid,kmp_taskdata_t * task)940b57cec5SDimitry Andric static inline void __kmp_release_deps(kmp_int32 gtid, kmp_taskdata_t *task) {
95*06c3fb27SDimitry Andric
96*06c3fb27SDimitry Andric #if OMPX_TASKGRAPH
97*06c3fb27SDimitry Andric if (task->is_taskgraph && !(__kmp_tdg_is_recording(task->tdg->tdg_status))) {
98*06c3fb27SDimitry Andric kmp_node_info_t *TaskInfo = &(task->tdg->record_map[task->td_task_id]);
99*06c3fb27SDimitry Andric
100*06c3fb27SDimitry Andric for (int i = 0; i < TaskInfo->nsuccessors; i++) {
101*06c3fb27SDimitry Andric kmp_int32 successorNumber = TaskInfo->successors[i];
102*06c3fb27SDimitry Andric kmp_node_info_t *successor = &(task->tdg->record_map[successorNumber]);
103*06c3fb27SDimitry Andric kmp_int32 npredecessors = KMP_ATOMIC_DEC(&successor->npredecessors_counter) - 1;
104*06c3fb27SDimitry Andric if (successor->task != nullptr && npredecessors == 0) {
105*06c3fb27SDimitry Andric __kmp_omp_task(gtid, successor->task, false);
106*06c3fb27SDimitry Andric }
107*06c3fb27SDimitry Andric }
108*06c3fb27SDimitry Andric return;
109*06c3fb27SDimitry Andric }
110*06c3fb27SDimitry Andric #endif
111*06c3fb27SDimitry Andric
1120b57cec5SDimitry Andric kmp_info_t *thread = __kmp_threads[gtid];
1130b57cec5SDimitry Andric kmp_depnode_t *node = task->td_depnode;
1140b57cec5SDimitry Andric
115e8d8bef9SDimitry Andric // Check mutexinoutset dependencies, release locks
116e8d8bef9SDimitry Andric if (UNLIKELY(node && (node->dn.mtx_num_locks < 0))) {
117e8d8bef9SDimitry Andric // negative num_locks means all locks were acquired
118e8d8bef9SDimitry Andric node->dn.mtx_num_locks = -node->dn.mtx_num_locks;
119e8d8bef9SDimitry Andric for (int i = node->dn.mtx_num_locks - 1; i >= 0; --i) {
120e8d8bef9SDimitry Andric KMP_DEBUG_ASSERT(node->dn.mtx_locks[i] != NULL);
121e8d8bef9SDimitry Andric __kmp_release_lock(node->dn.mtx_locks[i], gtid);
122e8d8bef9SDimitry Andric }
123e8d8bef9SDimitry Andric }
124e8d8bef9SDimitry Andric
1250b57cec5SDimitry Andric if (task->td_dephash) {
1260b57cec5SDimitry Andric KA_TRACE(
1270b57cec5SDimitry Andric 40, ("__kmp_release_deps: T#%d freeing dependencies hash of task %p.\n",
1280b57cec5SDimitry Andric gtid, task));
1290b57cec5SDimitry Andric __kmp_dephash_free(thread, task->td_dephash);
1300b57cec5SDimitry Andric task->td_dephash = NULL;
1310b57cec5SDimitry Andric }
1320b57cec5SDimitry Andric
1330b57cec5SDimitry Andric if (!node)
1340b57cec5SDimitry Andric return;
1350b57cec5SDimitry Andric
1360b57cec5SDimitry Andric KA_TRACE(20, ("__kmp_release_deps: T#%d notifying successors of task %p.\n",
1370b57cec5SDimitry Andric gtid, task));
1380b57cec5SDimitry Andric
1390b57cec5SDimitry Andric KMP_ACQUIRE_DEPNODE(gtid, node);
140*06c3fb27SDimitry Andric #if OMPX_TASKGRAPH
141*06c3fb27SDimitry Andric if (!task->is_taskgraph ||
142*06c3fb27SDimitry Andric (task->is_taskgraph && !__kmp_tdg_is_recording(task->tdg->tdg_status)))
143*06c3fb27SDimitry Andric #endif
1440b57cec5SDimitry Andric node->dn.task =
1450b57cec5SDimitry Andric NULL; // mark this task as finished, so no new dependencies are generated
1460b57cec5SDimitry Andric KMP_RELEASE_DEPNODE(gtid, node);
1470b57cec5SDimitry Andric
1480b57cec5SDimitry Andric kmp_depnode_list_t *next;
149e8d8bef9SDimitry Andric kmp_taskdata_t *next_taskdata;
1500b57cec5SDimitry Andric for (kmp_depnode_list_t *p = node->dn.successors; p; p = next) {
1510b57cec5SDimitry Andric kmp_depnode_t *successor = p->node;
15281ad6265SDimitry Andric #if USE_ITT_BUILD && USE_ITT_NOTIFY
15381ad6265SDimitry Andric __itt_sync_releasing(successor);
15481ad6265SDimitry Andric #endif
1550b57cec5SDimitry Andric kmp_int32 npredecessors = KMP_ATOMIC_DEC(&successor->dn.npredecessors) - 1;
1560b57cec5SDimitry Andric
1570b57cec5SDimitry Andric // successor task can be NULL for wait_depends or because deps are still
1580b57cec5SDimitry Andric // being processed
1590b57cec5SDimitry Andric if (npredecessors == 0) {
16081ad6265SDimitry Andric #if USE_ITT_BUILD && USE_ITT_NOTIFY
16181ad6265SDimitry Andric __itt_sync_acquired(successor);
16281ad6265SDimitry Andric #endif
1630b57cec5SDimitry Andric KMP_MB();
1640b57cec5SDimitry Andric if (successor->dn.task) {
1650b57cec5SDimitry Andric KA_TRACE(20, ("__kmp_release_deps: T#%d successor %p of %p scheduled "
1660b57cec5SDimitry Andric "for execution.\n",
1670b57cec5SDimitry Andric gtid, successor->dn.task, task));
168e8d8bef9SDimitry Andric // If a regular task depending on a hidden helper task, when the
169e8d8bef9SDimitry Andric // hidden helper task is done, the regular task should be executed by
170e8d8bef9SDimitry Andric // its encountering team.
171e8d8bef9SDimitry Andric if (KMP_HIDDEN_HELPER_THREAD(gtid)) {
172e8d8bef9SDimitry Andric // Hidden helper thread can only execute hidden helper tasks
173e8d8bef9SDimitry Andric KMP_ASSERT(task->td_flags.hidden_helper);
174e8d8bef9SDimitry Andric next_taskdata = KMP_TASK_TO_TASKDATA(successor->dn.task);
175e8d8bef9SDimitry Andric // If the dependent task is a regular task, we need to push to its
176e8d8bef9SDimitry Andric // encountering thread's queue; otherwise, it can be pushed to its own
177e8d8bef9SDimitry Andric // queue.
178e8d8bef9SDimitry Andric if (!next_taskdata->td_flags.hidden_helper) {
179349cc55cSDimitry Andric kmp_int32 encountering_gtid =
180349cc55cSDimitry Andric next_taskdata->td_alloc_thread->th.th_info.ds.ds_gtid;
181349cc55cSDimitry Andric kmp_int32 encountering_tid = __kmp_tid_from_gtid(encountering_gtid);
182349cc55cSDimitry Andric __kmpc_give_task(successor->dn.task, encountering_tid);
183e8d8bef9SDimitry Andric } else {
1840b57cec5SDimitry Andric __kmp_omp_task(gtid, successor->dn.task, false);
1850b57cec5SDimitry Andric }
186e8d8bef9SDimitry Andric } else {
187e8d8bef9SDimitry Andric __kmp_omp_task(gtid, successor->dn.task, false);
188e8d8bef9SDimitry Andric }
189e8d8bef9SDimitry Andric }
1900b57cec5SDimitry Andric }
1910b57cec5SDimitry Andric
1920b57cec5SDimitry Andric next = p->next;
1930b57cec5SDimitry Andric __kmp_node_deref(thread, p->node);
1940b57cec5SDimitry Andric #if USE_FAST_MEMORY
1950b57cec5SDimitry Andric __kmp_fast_free(thread, p);
1960b57cec5SDimitry Andric #else
1970b57cec5SDimitry Andric __kmp_thread_free(thread, p);
1980b57cec5SDimitry Andric #endif
1990b57cec5SDimitry Andric }
2000b57cec5SDimitry Andric
2010b57cec5SDimitry Andric __kmp_node_deref(thread, node);
2020b57cec5SDimitry Andric
2030b57cec5SDimitry Andric KA_TRACE(
2040b57cec5SDimitry Andric 20,
2050b57cec5SDimitry Andric ("__kmp_release_deps: T#%d all successors of %p notified of completion\n",
2060b57cec5SDimitry Andric gtid, task));
2070b57cec5SDimitry Andric }
2080b57cec5SDimitry Andric
2090b57cec5SDimitry Andric #endif // KMP_TASKDEPS_H
210